diff --git a/ia-legacy-importer/README b/ia-legacy-importer/README new file mode 100644 index 00000000..c6128a01 --- /dev/null +++ b/ia-legacy-importer/README @@ -0,0 +1,21 @@ +INSTALLATION + +you need python2.4, and, to import MARC catalogs, whatever +is required by catalog/marc/marc8_to_utf8.pl, including +this: + +http://search.cpan.org/dist/MARC-Charset/ + +you can test that the script is in basic working order by +running test-marc8_to_utf8.sh while in that directory. + +HOW TO IMPORT CATALOG DATA + +CATALOG=(this directory) +SOURCE_DATA=(path to data) +> cp $CATALOG/config-example.sh $MYDIR/config.sh +> # edit $MYDIR/config.sh +> $CATALOG/import.sh $MYDIR/config.sh "marc" "LC" "marc_records_scriblio_net/part01.dat" <$SOURCE_DATA + +see import.sh for details. + diff --git a/ia-legacy-importer/__init__.py b/ia-legacy-importer/__init__.py new file mode 100644 index 00000000..0216b77d --- /dev/null +++ b/ia-legacy-importer/__init__.py @@ -0,0 +1 @@ +"""catalog""" diff --git a/ia-legacy-importer/add_book/__init__.py b/ia-legacy-importer/add_book/__init__.py new file mode 100644 index 00000000..c9ec4e9c --- /dev/null +++ b/ia-legacy-importer/add_book/__init__.py @@ -0,0 +1,748 @@ +"""Module to load books into Open Library. + +This is used to load books from various MARC sources, including +Internet Archive. + +For loading a book, the available metadata is compiled as a dict, +called a record internally. Here is a sample record: + + { + "title": "The Adventures of Tom Sawyer", + "source_records": ["ia:TheAdventuresOfTomSawyer_201303"], + "authors": [{ + "name": "Mark Twain" + }] + } + +The title and source_records fields are mandatory. + +A record is loaded by calling the load function. + + record = {...} + response = load(record) + +""" +import json +import re +import six +from six.moves import urllib +import unicodedata +import web + +from collections import defaultdict +from copy import copy +from time import sleep + +from infogami import config + +from openlibrary import accounts +from openlibrary.catalog.merge.merge_marc import build_marc +from openlibrary.catalog.utils import mk_norm +from openlibrary.core import lending +from openlibrary.utils.isbn import normalize_isbn + +from openlibrary.catalog.add_book.load_book import build_query, east_in_by_statement, import_author, InvalidLanguage +from openlibrary.catalog.add_book.merge import try_merge + + +re_normalize = re.compile('[^[:alphanum:] ]', re.U) +re_lang = re.compile('^/languages/([a-z]{3})$') + + +type_map = { + 'description': 'text', + 'notes': 'text', + 'number_of_pages': 'int', +} + + +class CoverNotSaved(Exception): + def __init__(self, f): + self.f = f + def __str__(self): + return "coverstore responded with: '%s'" % self.f + + +class RequiredField(Exception): + def __init__(self, f): + self.f = f + def __str__(self): + return "missing required field: %s" % self.f + + +# don't use any of these as work titles +bad_titles = set(('Publications', 'Works. English', 'Missal', 'Works', 'Report', \ + 'Letters', 'Calendar', 'Bulletin', 'Plays', 'Sermons', 'Correspondence', \ + 'Bill', 'Bills', 'Selections', 'Selected works', 'Selected works. 
English', \ + 'The Novels', 'Laws, etc')) + +subject_fields = ['subjects', 'subject_places', 'subject_times', 'subject_people' ] + + +def strip_accents(s): + """http://stackoverflow.com/questions/517923/what-is-the-best-way-to-remove-accents-in-a-python-unicode-string + """ + if isinstance(s, str): + return s + assert isinstance(s, six.text_type) + return ''.join((c for c in unicodedata.normalize('NFD', s) if unicodedata.category(c) != 'Mn')) + + +def normalize(s): # strip non-alphanums and truncate at 25 chars + norm = strip_accents(s).lower() + norm = norm.replace(' and ', ' ') + if norm.startswith('the '): + norm = norm[4:] + elif norm.startswith('a '): + norm = norm[2:] + # strip bracketed text + norm = re.sub(r' ?\(.*\)', '', norm) + return norm.replace(' ', '')[:25] + + +def is_redirect(thing): + """ + :param Thing thing: + :rtype: bool + """ + if not thing: + return False + return thing.type.key == '/type/redirect' + + +def get_title(e): + if not e.get('work_titles'): + return e['title'] + wt = e['work_titles'][0] + return e['title'] if wt in bad_titles else e['title'] + + +def find_matching_work(e): + """ + Looks for an existing Work representing the new import edition by + comparing normalized titles for every work by each author of the current edition. + Returns the first match found, or None. + + :param dict e: An OL edition suitable for saving, has a key, and has full Authors with keys + but has not yet been saved. + :rtype: None or str + :return: the matched work key "/works/OL..W" if found + """ + + norm_title = mk_norm(get_title(e)) + seen = set() + for a in e['authors']: + q = { + 'type': '/type/work', + 'authors': {'author': {'key': a['key']}} + } + work_keys = list(web.ctx.site.things(q)) + for wkey in work_keys: + w = web.ctx.site.get(wkey) + if wkey in seen: + continue + seen.add(wkey) + if not w.get('title'): + continue + if mk_norm(w['title']) == norm_title: + assert w.type.key == '/type/work' + return wkey + + +def build_author_reply(author_in, edits): + """ + Steps through an import record's authors, and creates new records if new, + adding them to 'edits' to be saved later. + + :param list author_in: List of import sourced author dicts [{"name:" "Some One"}, ...], possibly with dates + :param list edits: list of Things to be saved later. Is modfied by this method. 
+ :rtype: tuple + :return: (list, list) authors [{"key": "/author/OL..A"}, ...], author_reply the JSON status response to return for each author + """ + + authors = [] + author_reply = [] + for a in author_in: + new_author = 'key' not in a + if new_author: + a['key'] = web.ctx.site.new_key('/type/author') + edits.append(a) + authors.append({'key': a['key']}) + author_reply.append({ + 'key': a['key'], + 'name': a['name'], + 'status': ('created' if new_author else 'matched'), + }) + return (authors, author_reply) + + +def new_work(edition, rec, cover_id=None): + """ + :param dict edition: New OL Edition + :param dict rec: Edition import data + :param (int|None) cover_id: cover id + :rtype: dict + :return: a work to save + """ + w = { + 'type': {'key': '/type/work'}, + 'title': get_title(rec), + } + for s in subject_fields: + if s in rec: + w[s] = rec[s] + + if 'authors' in edition: + w['authors'] = [{'type':{'key': '/type/author_role'}, 'author': akey} for akey in edition['authors']] + + if 'description' in rec: + w['description'] = {'type': '/type/text', 'value': rec['description']} + + wkey = web.ctx.site.new_key('/type/work') + if edition.get('covers'): + w['covers'] = edition['covers'] + w['key'] = wkey + return w + + +def add_cover(cover_url, ekey, account=None): + """ + Adds a cover to coverstore and returns the cover id. + + :param str cover_url: URL of cover image + :param str ekey: Edition key /book/OL..M + :rtype: int or None + :return: Cover id, or None if upload did not succeed + """ + olid = ekey.split("/")[-1] + coverstore_url = config.get('coverstore_url').rstrip('/') + upload_url = coverstore_url + '/b/upload2' + if upload_url.startswith("//"): + upload_url = "{0}:{1}".format(web.ctx.get("protocol", "http"), upload_url) + user = account or accounts.get_current_user() + params = { + 'author': user.get('key') or user.get('_key'), + 'data': None, + 'source_url': cover_url, + 'olid': olid, + 'ip': web.ctx.ip, + } + reply = None + for attempt in range(10): + try: + res = urllib.request.urlopen(upload_url, urllib.parse.urlencode(params)) + except IOError: + sleep(2) + continue + body = res.read() + if res.getcode() == 500: + raise CoverNotSaved(body) + if body not in ['', 'None']: + reply = json.loads(body) + if res.getcode() == 200 and 'id' in reply: + break + sleep(2) + if not reply or reply.get('message') == 'Invalid URL': + return + cover_id = int(reply['id']) + return cover_id + +def get_ia_item(ocaid): + import internetarchive as ia + cfg = {'general': {'secure': False}} + item = ia.get_item(ocaid, config=cfg) + return item + +def modify_ia_item(item, data): + access_key = lending.config_ia_ol_metadata_write_s3 and lending.config_ia_ol_metadata_write_s3['s3_key'] + secret_key = lending.config_ia_ol_metadata_write_s3 and lending.config_ia_ol_metadata_write_s3['s3_secret'] + return item.modify_metadata(data, access_key=access_key, secret_key=secret_key) + +def create_ol_subjects_for_ocaid(ocaid, subjects): + item = get_ia_item(ocaid) + openlibrary_subjects = copy(item.metadata.get('openlibrary_subject')) or [] + + if not isinstance(openlibrary_subjects, list): + openlibrary_subjects = [openlibrary_subjects] + + for subject in subjects: + if subject not in openlibrary_subjects: + openlibrary_subjects.append(subject) + + r = modify_ia_item(item, {'openlibrary_subject': openlibrary_subjects}) + if r.status_code != 200: + return ('%s failed: %s' % (item.identifier, r.content)) + else: + return ("success for %s" % item.identifier) + +def 
update_ia_metadata_for_ol_edition(edition_id): + """ + Writes the Open Library Edition and Work id to a linked + archive.org item. + + :param str edition_id: of the form OL..M + :rtype: dict + :return: error report, or modified archive.org metadata on success + """ + + data = {'error': 'No qualifying edition'} + if edition_id: + ed = web.ctx.site.get('/books/%s' % edition_id) + if ed.ocaid: + work = ed.works[0] if ed.get('works') else None + if work and work.key: + item = get_ia_item(ed.ocaid) + work_id = work.key.split('/')[2] + r = modify_ia_item(item, { + 'openlibrary_work': work_id, + 'openlibrary_edition': edition_id + }) + if r.status_code != 200: + data = {'error': '%s failed: %s' % (item.identifier, r.content)} + else: + data = item.metadata + return data + + +def normalize_record_isbns(rec): + """ + Returns the Edition import record with all ISBN fields cleaned. + + :param dict rec: Edition import record + :rtype: dict + :return: A record with cleaned ISBNs in the various possible ISBN locations. + """ + for field in ('isbn_13', 'isbn_10', 'isbn'): + if rec.get(field): + rec[field] = [normalize_isbn(isbn) for isbn in rec.get(field) if normalize_isbn(isbn)] + return rec + + +def isbns_from_record(rec): + """ + Returns a list of all isbns from the various possible isbn fields. + + :param dict rec: Edition import record + :rtype: list + """ + isbns = rec.get('isbn', []) + rec.get('isbn_10', []) + rec.get('isbn_13', []) + return isbns + + +def build_pool(rec): + """ + Searches for existing edition matches on title and bibliographic keys. + + :param dict rec: Edition record + :rtype: dict + :return: {: [list of /books/OL..M keys that match rec on ]} + """ + pool = defaultdict(set) + match_fields = ('title', 'oclc_numbers', 'lccn', 'ocaid') + + # Find records with matching fields + for field in match_fields: + pool[field] = set(editions_matched(rec, field)) + + # update title pool with normalized title matches + pool['title'].update(set(editions_matched(rec, 'normalized_title_', normalize(rec['title'])))) + + # Find records with matching ISBNs + isbns = isbns_from_record(rec) + if isbns: + pool['isbn'] = set(editions_matched(rec, 'isbn_', isbns)) + + return dict((k, list(v)) for k, v in pool.iteritems() if v) + + +def early_exit(rec): + """ + Attempts to quickly find an existing item match using bibliographic keys. + + :param dict rec: Edition record + :rtype: str|bool + :return: First key matched of format "/books/OL..M" or False if no match found. + """ + + if 'openlibrary' in rec: + return '/books/' + rec['openlibrary'] + + ekeys = editions_matched(rec, 'ocaid') + if ekeys: + return ekeys[0] + + isbns = isbns_from_record(rec) + if isbns: + ekeys = editions_matched(rec, 'isbn_', isbns) + if ekeys: + return ekeys[0] + + # only searches for the first value from these lists + for f in 'source_records', 'oclc_numbers', 'lccn': + if rec.get(f): + ekeys = editions_matched(rec, f, rec[f][0]) + if ekeys: + return ekeys[0] + return False + + +def editions_matched(rec, key, value=None): + """ + Search OL for editions matching record's 'key' value. + + :param dict rec: Edition import record + :param str key: Key to search on, e.g. 
'isbn_' + :param list|str value: Value or Values to use, overriding record values + :rtpye: list + :return: List of edition keys ["/books/OL..M",] + """ + if value is None and key not in rec: + return [] + + if value is None: + value = rec[key] + q = { + 'type':'/type/edition', + key: value + } + ekeys = list(web.ctx.site.things(q)) + return ekeys + + +def find_exact_match(rec, edition_pool): + """ + Returns an edition key match for rec from edition_pool + Only returns a key if all values match? + + :param dict rec: Edition import record + :param dict edition_pool: + :rtype: str|bool + :return: edition key + """ + seen = set() + for field, editions in edition_pool.iteritems(): + for ekey in editions: + if ekey in seen: + continue + seen.add(ekey) + existing = web.ctx.site.get(ekey) + match = True + for k, v in rec.items(): + if k == 'source_records': + continue + existing_value = existing.get(k) + if not existing_value: + continue + if k == 'languages': + existing_value = [str(re_lang.match(l.key).group(1)) for l in existing_value] + if k == 'authors': + existing_value = [dict(a) for a in existing_value] + for a in existing_value: + del a['type'] + del a['key'] + for a in v: + if 'entity_type' in a: + del a['entity_type'] + if 'db_name' in a: + del a['db_name'] + + if existing_value != v: + match = False + break + if match: + return ekey + return False + + +def find_match(e1, edition_pool): + """ + Find the best match for e1 in edition_pool and return its key. + :param dict e1: the new edition we are trying to match, output of build_marc(import record) + :param list edition_pool: list of possible edition matches, output of build_pool(import record) + :rtype: str|None + :return: None or the edition key '/books/OL...M' of the best edition match for e1 in edition_pool + """ + seen = set() + for k, v in edition_pool.iteritems(): + for edition_key in v: + if edition_key in seen: + continue + thing = None + found = True + while not thing or is_redirect(thing): + seen.add(edition_key) + thing = web.ctx.site.get(edition_key) + if thing is None: + found = False + break + if is_redirect(thing): + edition_key = thing['location'] + # FIXME: this updates edition_key, but leaves thing as redirect, + # which will raise an exception in try_merge() + if not found: + continue + if try_merge(e1, edition_key, thing): + return edition_key + + +def add_db_name(rec): + """ + db_name = Author name followed by dates. + adds 'db_name' in place for each author. + """ + if 'authors' not in rec: + return + + for a in rec['authors']: + date = None + if 'date' in a: + assert 'birth_date' not in a and 'death_date' not in a + date = a['date'] + elif 'birth_date' in a or 'death_date' in a: + date = a.get('birth_date', '') + '-' + a.get('death_date', '') + a['db_name'] = ' '.join([a['name'], date]) if date else a['name'] + + +def load_data(rec, account=None): + """ + Adds a new Edition to Open Library. Checks for existing Works. + Creates a new Work, and Author, if required, + otherwise associates the new Edition with the existing Work. + + :param dict rec: Edition record to add (no further checks at this point) + :rtype: dict + :return: + { + "success": False, + "error": + } + OR + { + "success": True, + "work": {"key": , "status": "created" | "modified" | "matched"}, + "edition": {"key": , "status": "created"}, + "authors": [{"status": "matched", "name": "John Smith", "key": }, ...] 
+ } + """ + + cover_url = None + if 'cover' in rec: + cover_url = rec['cover'] + del rec['cover'] + try: + # get an OL style edition dict + edition = build_query(rec) + except InvalidLanguage as e: + return { + 'success': False, + 'error': str(e), + } + + ekey = web.ctx.site.new_key('/type/edition') + cover_id = None + if cover_url: + cover_id = add_cover(cover_url, ekey, account=account) + if cover_id: + edition['covers'] = [cover_id] + + edits = [] # Things (Edition, Work, Authors) to be saved + reply = {} + # TOFIX: edition.authors has already been processed by import_authors() in build_query(), following line is a NOP? + author_in = [import_author(a, eastern=east_in_by_statement(rec, a)) for a in edition.get('authors', [])] + # build_author_reply() adds authors to edits + (authors, author_reply) = build_author_reply(author_in, edits) + + if authors: + edition['authors'] = authors + reply['authors'] = author_reply + + wkey = None + work_state = 'created' + # Look for an existing work + if 'authors' in edition: + wkey = find_matching_work(edition) + if wkey: + w = web.ctx.site.get(wkey) + work_state = 'matched' + found_wkey_match = True + need_update = False + for k in subject_fields: + if k not in rec: + continue + for s in rec[k]: + if normalize(s) not in [normalize(existing) for existing in w.get(k, [])]: + w.setdefault(k, []).append(s) + need_update = True + if cover_id: + w.setdefault('covers', []).append(cover_id) + need_update = True + if need_update: + work_state = 'modified' + edits.append(w.dict()) + else: + # Create new work + w = new_work(edition, rec, cover_id) + wkey = w['key'] + edits.append(w) + + assert wkey + edition['works'] = [{'key': wkey}] + edition['key'] = ekey + edits.append(edition) + + web.ctx.site.save_many(edits, comment='import new book', action='add-book') + + # Writes back `openlibrary_edition` and `openlibrary_work` to + # archive.org item after successful import: + if 'ocaid' in rec: + update_ia_metadata_for_ol_edition(ekey.split('/')[-1]) + + reply['success'] = True + reply['edition'] = {'key': ekey, 'status': 'created'} + reply['work'] = {'key': wkey, 'status': work_state} + return reply + + +def load(rec, account=None): + """Given a record, tries to add/match that edition in the system. + + Record is a dictionary containing all the metadata of the edition. 
+ The following fields are mandatory: + + * title: str + * source_records: list + + :param dict rec: Edition record to add + :rtype: dict + :return: a dict to be converted into a JSON HTTP response, same as load_data() + """ + required_fields = ['title', 'source_records'] # ['authors', 'publishers', 'publish_date'] + for field in required_fields: + if not rec.get(field): + raise RequiredField(field) + if isinstance(rec['source_records'], six.string_types): + rec['source_records'] = [rec['source_records']] + + rec = normalize_record_isbns(rec) + + edition_pool = build_pool(rec) + if not edition_pool: + # No match candidates found, add edition + return load_data(rec, account=account) + + match = early_exit(rec) + if not match: + match = find_exact_match(rec, edition_pool) + + if not match: + rec['full_title'] = rec['title'] + if rec.get('subtitle'): + rec['full_title'] += ' ' + rec['subtitle'] + e1 = build_marc(rec) + add_db_name(e1) + match = find_match(e1, edition_pool) + + if not match: + # No match found, add edition + return load_data(rec, account=account) + + # We have an edition match at this point + need_work_save = need_edition_save = False + w = None + e = web.ctx.site.get(match) + # check for, and resolve, author redirects + for a in e.authors: + while is_redirect(a): + if a in e.authors: + e.authors.remove(a) + a = web.ctx.site.get(a.location) + if not is_redirect(a): + e.authors.append(a) + + if e.get('works'): + w = e.works[0].dict() + work_created = False + else: + # Found an edition without a work + work_created = need_work_save = need_edition_save = True + w = new_work(e.dict(), rec) + e.works = [{'key': w['key']}] + + # Add subjects to work, if not already present + if 'subjects' in rec: + work_subjects = list(w.get('subjects', [])) + for s in rec['subjects']: + if s not in work_subjects: + work_subjects.append(s) + need_work_save = True + if need_work_save and work_subjects: + w['subjects'] = work_subjects + + # Add cover to edition + if 'cover' in rec and not e.get_covers(): + cover_url = rec['cover'] + cover_id = add_cover(cover_url, e.key, account=account) + if cover_id: + e['covers'] = [cover_id] + need_edition_save = True + + # Add cover to work, if needed + if not w.get('covers') and e.get_covers(): + w['covers'] = [e['covers'][0]] + need_work_save = True + + # Add description to work, if needed + if not w.get('description') and e.get('description'): + w['description'] = e['description'] + need_work_save = True + + # Add authors to work, if needed + if not w.get('authors'): + authors = [import_author(a) for a in rec.get('authors', [])] + w['authors'] = [{'type':{'key': '/type/author_role'}, 'author': a.key} for a in authors if a.get('key')] + if w.get('authors'): + need_work_save = True + + # Add ocaid to edition (str), if needed + if 'ocaid' in rec and not e.ocaid: + e['ocaid'] = rec['ocaid'] + need_edition_save = True + + edition_fields = [ + 'local_id', 'ia_box_id', 'ia_loaded_id', 'source_records'] + # TODO: + # only consider `source_records` for newly created work + # or if field originally missing: + #if work_created and not e.get('source_records'): + # edition_fields.append('source_records') + for f in edition_fields: + if f not in rec: + continue + # ensure values is a list + values = rec[f] if isinstance(rec[f], list) else [rec[f]] + if f in e: + # get values from rec that are not currently on the edition + to_add = [v for v in values if v not in e[f]] + e[f] += to_add + else: + e[f] = to_add = values + if to_add: + need_edition_save = True + + edits = [] + 
reply = { + 'success': True, + 'edition': {'key': match, 'status': 'matched'}, + 'work': {'key': w['key'], 'status': 'matched'}, + } + if need_edition_save: + reply['edition']['status'] = 'modified' + edits.append(e.dict()) + if need_work_save: + reply['work']['status'] = 'created' if work_created else 'modified' + edits.append(w) + if edits: + web.ctx.site.save_many(edits, comment='import existing book', action='edit-book') + if 'ocaid' in rec: + update_ia_metadata_for_ol_edition(match.split('/')[-1]) + return reply diff --git a/ia-legacy-importer/add_book/load_book.py b/ia-legacy-importer/add_book/load_book.py new file mode 100644 index 00000000..a226bc32 --- /dev/null +++ b/ia-legacy-importer/add_book/load_book.py @@ -0,0 +1,224 @@ +import web +import re +from openlibrary.catalog.utils import flip_name, author_dates_match, key_int + + +def east_in_by_statement(rec, author): + """ + Returns False if there is no by_statement in rec. + Otherwise returns whether author name uses eastern name order. + TODO: elaborate on what this actually means, and how it is used. + + :param dict rec: import source edition record + :param dict author: import source author dict: {"name": "Some One"} + :rtype: bool + """ + + if 'by_statement' not in rec: + return False + if 'authors' not in rec: + return False + name = author['name'] + flipped = flip_name(name) + name = name.replace('.', '') + name = name.replace(', ', '') + if name == flipped.replace('.', ''): + # name was not flipped + return False + return rec['by_statement'].find(name) != -1 + + +def do_flip(author): + """ + Given an author import dict, flip its name in place + i.e. Smith, John => John Smith + + :param dict author: + :rtype: None + """ + if 'personal_name' not in author: + return + if author['personal_name'] != author['name']: + return + first_comma = author['name'].find(', ') + if first_comma == -1: + return + # e.g: Harper, John Murdoch, 1845- + if author['name'].find(',', first_comma + 1) != -1: + return + if author['name'].find('i.e.') != -1: + return + if author['name'].find('i. e.') != -1: + return + name = flip_name(author['name']) + author['name'] = name + author['personal_name'] = name + + +def pick_from_matches(author, match): + """ + Finds the best match for author from a list of OL authors records, match. + + :param dict author: Author import representation + :param list match: List of matching OL author records + :rtype: dict + :return: A single OL author record from match + """ + maybe = [] + if 'birth_date' in author and 'death_date' in author: + maybe = [m for m in match if 'birth_date' in m and 'death_date' in m] + elif 'date' in author: + maybe = [m for m in match if 'date' in m] + if not maybe: + maybe = match + if len(maybe) == 1: + return maybe[0] + return min(maybe, key=key_int) + + +def find_author(name): + """ + Searches OL for an author by name. 
+ + :param str name: Author's name + :rtype: list + :return: A list of OL author representations than match name + """ + def walk_redirects(obj, seen): + seen.add(obj['key']) + while obj['type']['key'] == '/type/redirect': + assert obj['location'] != obj['key'] + obj = web.ctx.site.get(obj['location']) + seen.add(obj['key']) + return obj + + q = {'type': '/type/author', 'name': name} # FIXME should have no limit + reply = list(web.ctx.site.things(q)) + authors = [web.ctx.site.get(k) for k in reply] + if any(a.type.key != '/type/author' for a in authors): + seen = set() + authors = [walk_redirects(a, seen) for a in authors if a['key'] not in seen] + return authors + + +def find_entity(author): + """ + Looks for an existing Author record in OL by name + and returns it if found. + + :param dict author: Author import dict {"name": "Some One"} + :rtype: dict|None + :return: Existing Author record, if one is found + """ + name = author['name'] + things = find_author(name) + et = author.get('entity_type') + if et and et != 'person': + if not things: + return None + db_entity = things[0] + assert db_entity['type']['key'] == '/type/author' + return db_entity + if ', ' in name: + things += find_author(flip_name(name)) + match = [] + seen = set() + for a in things: + key = a['key'] + if key in seen: + continue + seen.add(key) + orig_key = key + assert a.type.key == '/type/author' + if 'birth_date' in author and 'birth_date' not in a: + continue + if 'birth_date' not in author and 'birth_date' in a: + continue + if not author_dates_match(author, a): + continue + match.append(a) + if not match: + return None + if len(match) == 1: + return match[0] + return pick_from_matches(author, match) + + +def import_author(author, eastern=False): + """ + Converts an import style new-author dictionary into an + Open Library existing author, or new author candidate, representation. + Does NOT create new authors. + + :param dict author: Author import record {"name": "Some One"} + :param bool eastern: Eastern name order + :rtype: dict + :return: Open Library style Author representation, either exisiting with "key", + or new candidate without "key". + """ + existing = find_entity(author) + if existing: + assert existing.type.key == '/type/author' + for k in 'last_modified', 'id', 'revision', 'created': + if existing.k: + del existing.k + new = existing + if 'death_date' in author and 'death_date' not in existing: + new['death_date'] = author['death_date'] + return new + if not eastern: + do_flip(author) + a = {'type': {'key': '/type/author'}} + for f in 'name', 'title', 'personal_name', 'birth_date', 'death_date', 'date': + if f in author: + a[f] = author[f] + return a + + +class InvalidLanguage(Exception): + def __init__(self, code): + self.code = code + def __str__(self): + return "invalid language code: '%s'" % self.code + + +type_map = { 'description': 'text', 'notes': 'text', 'number_of_pages': 'int' } + + +def build_query(rec): + """ + Takes an edition record dict, rec, and returns an Open Library edition + suitable for saving. 
+ + :param dict rec: Edition record to add to Open Library + :rtype: dict + :return: Open Library style edition representation + """ + book = { + 'type': { 'key': '/type/edition'}, + } + + for k, v in rec.iteritems(): + if k == 'authors': + if v and v[0]: + book['authors'] = [] + for author in v: + east = east_in_by_statement(rec, author) + book['authors'].append(import_author(author, eastern=east)) + continue + if k == 'languages': + langs = [] + for l in v: + if web.ctx.site.get('/languages/' + l) is None: + raise InvalidLanguage(l) + book['languages'] = [{'key': '/languages/' + l} for l in v] + continue + if k in type_map: + t = '/type/' + type_map[k] + if isinstance(v, list): + book[k] = [{'type': t, 'value': i} for i in v] + else: + book[k] = {'type': t, 'value': v} + else: + book[k] = v + return book diff --git a/ia-legacy-importer/add_book/merge.py b/ia-legacy-importer/add_book/merge.py new file mode 100644 index 00000000..15c8a60d --- /dev/null +++ b/ia-legacy-importer/add_book/merge.py @@ -0,0 +1,50 @@ +from openlibrary.catalog.merge.merge_marc import build_marc, attempt_merge +import web + +threshold = 875 + +def db_name(a): + date = None + if a.birth_date or a.death_date: + date = a.get('birth_date', '') + '-' + a.get('death_date', '') + elif a.date: + date = a.date + return ' '.join([a['name'], date]) if date else a['name'] + +# FIXME: badly named. edition_record_equal? (candidate_ed, existing_ed) +def try_merge(e1, edition_key, existing): + """ + Converts the existing edition into a comparable dict and performs a + thresholded comparison to decide whether they are the same. + Used by add_book.load() -> add_book.find_match() to check whether two + editions match. + + :param dict e1: Output of build_marc(import record candidate) + :param str edition_key: edition key of existing + :param Thing existing: Edition object to be tested against e1, the object of edition_key + :rtype: bool + :return: Whether e1 is sufficiently the same as the 'existing' edition + """ + + thing_type = existing.type.key + if thing_type == '/type/delete': + return False + # FIXME: will fail if existing is a redirect. 
+ assert thing_type == '/type/edition' + rec2 = {} + rec2['full_title'] = existing.title + if existing.subtitle: + rec2['full_title'] += ' ' + existing.subtitle + for f in 'isbn', 'isbn_10', 'isbn_13', 'lccn', 'publish_country', 'publishers', 'publish_date': + if existing.get(f): + rec2[f] = existing[f] + if existing.authors: + rec2['authors'] = [] + for a in existing.authors: + while a.type.key == '/type/redirect': + a = web.ctx.site.get(a.location) + if a.type.key == '/type/author': + assert a['name'] + rec2['authors'].append({'name': a['name'], 'db_name': db_name(a)}) + e2 = build_marc(rec2) + return attempt_merge(e1, e2, threshold) diff --git a/ia-legacy-importer/add_book/test_add_book.py b/ia-legacy-importer/add_book/test_add_book.py new file mode 100644 index 00000000..5dcf4206 --- /dev/null +++ b/ia-legacy-importer/add_book/test_add_book.py @@ -0,0 +1,840 @@ +from __future__ import print_function + +import os +import pytest + +from copy import deepcopy +from collections import defaultdict + +from infogami.infobase.core import Text + +from openlibrary.catalog import add_book +from openlibrary.catalog.add_book import add_db_name, build_pool, editions_matched, isbns_from_record, load, RequiredField +from openlibrary.catalog.add_book.load_book import build_query, InvalidLanguage +from openlibrary.catalog.add_book.merge import try_merge + +from openlibrary.catalog.merge.merge_marc import build_marc +from openlibrary.catalog.marc.parse import read_edition +from openlibrary.catalog.marc.marc_binary import MarcBinary, BadLength, BadMARC + + +from six.moves.urllib.request import urlopen + + +def open_test_data(filename): + """Returns a file handle to file with specified filename inside test_data directory. + """ + root = os.path.dirname(__file__) + fullpath = os.path.join(root, 'test_data', filename) + return open(fullpath) + +@pytest.fixture +def add_languages(mock_site): + languages = [ + ('eng', 'English'), + ('spa', 'Spanish'), + ('fre', 'French'), + ('yid', 'Yiddish'), + ] + for code, name in languages: + mock_site.save({ + 'key': '/languages/' + code, + 'name': name, + 'type': {'key': '/type/language'}, + }) + +@pytest.fixture +def ia_writeback(monkeypatch): + """Prevent ia writeback from making live requests. 
+ """ + monkeypatch.setattr(add_book, 'update_ia_metadata_for_ol_edition', lambda olid: {}) + +def test_build_query(add_languages): + rec = { + 'title': 'magic', + 'languages': ['eng', 'fre'], + 'authors': [{}], + 'description': 'test', + } + q = build_query(rec) + assert q['title'] == 'magic' + assert q['description'] == {'type': '/type/text', 'value': 'test'} + assert q['type'] == {'key': '/type/edition'} + assert q['languages'] == [{'key': '/languages/eng'}, {'key': '/languages/fre'}] + + pytest.raises(InvalidLanguage, build_query, {'languages': ['wtf']}) + +def test_isbns_from_record(): + rec = {'title': 'test', 'isbn_13': ['9780190906764'], 'isbn_10': ['0190906766']} + result = isbns_from_record(rec) + assert isinstance(result, list) + assert '9780190906764' in result + assert '0190906766' in result + assert len(result) == 2 + +def test_editions_matched_no_results(mock_site): + rec = {'title': 'test', 'isbn_13': ['9780190906764'], 'isbn_10': ['0190906766']} + isbns = isbns_from_record(rec) + result = editions_matched(rec, 'isbn_', isbns) + # returns no results because there are no existing editions + assert result == [] + +def test_editions_matched(mock_site, add_languages, ia_writeback): + rec = {'title': 'test', 'isbn_13': ['9780190906764'], 'isbn_10': ['0190906766'], 'source_records': ['test:001']} + load(rec) + isbns = isbns_from_record(rec) + + result_10 = editions_matched(rec, 'isbn_10', '0190906766') + assert result_10 == ['/books/OL1M'] + + result_13 = editions_matched(rec, 'isbn_13', '9780190906764') + assert result_13 == ['/books/OL1M'] + + # searching on key isbn_ will return a matching record on either isbn_10 or isbn_13 metadata fields + result = editions_matched(rec, 'isbn_', isbns) + assert result == ['/books/OL1M'] + +def test_load_without_required_field(): + rec = {'ocaid': 'test item'} + pytest.raises(RequiredField, load, {'ocaid': 'test_item'}) + +def test_load_test_item(mock_site, add_languages, ia_writeback): + rec = { + 'ocaid': 'test_item', + 'source_records': ['ia:test_item'], + 'title': 'Test item', + 'languages': ['eng'], + } + reply = load(rec) + assert reply['success'] is True + assert reply['edition']['status'] == 'created' + e = mock_site.get(reply['edition']['key']) + assert e.type.key == '/type/edition' + assert e.title == 'Test item' + assert e.ocaid == 'test_item' + assert e.source_records == ['ia:test_item'] + l = e.languages + assert len(l) == 1 and l[0].key == '/languages/eng' + + assert reply['work']['status'] == 'created' + w = mock_site.get(reply['work']['key']) + assert w.title == 'Test item' + assert w.type.key == '/type/work' + +def test_load_with_subjects(mock_site, ia_writeback): + rec = { + 'ocaid': 'test_item', + 'title': 'Test item', + 'subjects': ['Protected DAISY', 'In library'], + 'source_records': 'ia:test_item', + } + reply = load(rec) + assert reply['success'] is True + w = mock_site.get(reply['work']['key']) + assert w.title == 'Test item' + assert w.subjects == ['Protected DAISY', 'In library'] + +def test_load_with_new_author(mock_site, ia_writeback): + rec = { + 'ocaid': 'test_item', + 'title': 'Test item', + 'authors': [{'name': 'John Doe'}], + 'source_records': 'ia:test_item', + } + reply = load(rec) + assert reply['success'] is True + w = mock_site.get(reply['work']['key']) + assert reply['authors'][0]['status'] == 'created' + assert reply['authors'][0]['name'] == 'John Doe' + akey1 = reply['authors'][0]['key'] + assert akey1 == '/authors/OL1A' + a = mock_site.get(akey1) + assert w.authors + assert a.type.key == 
'/type/author' + + # Tests an existing author is modified if an Author match is found, and more data is provided + # This represents an edition of another work by the above author. + rec = { + 'ocaid': 'test_item1b', + 'title': 'Test item1b', + 'authors': [{'name': 'Doe, John', 'entity_type': 'person'}], + 'source_records': 'ia:test_item1b', + } + reply = load(rec) + assert reply['success'] is True + assert reply['edition']['status'] == 'created' + assert reply['work']['status'] == 'created' + akey2 = reply['authors'][0]['key'] + + # TODO: There is no code that modifies an author if more data is provided. + # previously the status implied the record was always 'modified', when a match was found. + #assert reply['authors'][0]['status'] == 'modified' + #a = mock_site.get(akey2) + #assert 'entity_type' in a + #assert a.entity_type == 'person' + + assert reply['authors'][0]['status'] == 'matched' + assert akey1 == akey2 == '/authors/OL1A' + + # Tests same title with different ocaid and author is not overwritten + rec = { + 'ocaid': 'test_item2', + 'title': 'Test item', + 'authors': [{'name': 'James Smith'}], + 'source_records': 'ia:test_item2', + } + reply = load(rec) + akey3 = reply['authors'][0]['key'] + assert akey3 == '/authors/OL2A' + assert reply['authors'][0]['status'] == 'created' + assert reply['work']['status'] == 'created' + assert reply['edition']['status'] == 'created' + w = mock_site.get(reply['work']['key']) + e = mock_site.get(reply['edition']['key']) + assert e.ocaid == 'test_item2' + assert len(w.authors) == 1 + assert len(e.authors) == 1 + +def test_load_with_redirected_author(mock_site, add_languages): + """Test importing existing editions without works + which have author redirects. A work should be created with + the final author. 
+ """ + redirect_author = { + 'type': {'key': '/type/redirect'}, + 'name': 'John Smith', + 'key': '/authors/OL55A', + 'location': '/authors/OL10A'} + final_author = { + 'type': {'key': '/type/author'}, + 'name': 'John Smith', + 'key': '/authors/OL10A'} + orphaned_edition = { + 'title': 'Test item HATS', + 'key': '/books/OL10M', + 'publishers': ['TestPub'], + 'publish_date': '1994', + 'authors': [{'key': '/authors/OL55A'}], + 'type': {'key': '/type/edition'}} + mock_site.save(orphaned_edition) + mock_site.save(redirect_author) + mock_site.save(final_author) + + rec = { + 'title': 'Test item HATS', + 'authors': [{'name': 'John Smith'}], + 'publishers': ['TestPub'], + 'publish_date': '1994', + 'source_records': 'ia:test_redir_author'} + reply = load(rec) + assert reply['edition']['status'] == 'modified' + assert reply['edition']['key'] == '/books/OL10M' + assert reply['work']['status'] == 'created' + e = mock_site.get(reply['edition']['key']) + assert e.authors[0].key == '/authors/OL10A' + w = mock_site.get(reply['work']['key']) + assert w.authors[0].author.key == '/authors/OL10A' + +def test_duplicate_ia_book(mock_site, add_languages, ia_writeback): + rec = { + 'ocaid': 'test_item', + 'source_records': ['ia:test_item'], + 'title': 'Test item', + 'languages': ['eng'], + } + reply = load(rec) + assert reply['success'] is True + assert reply['edition']['status'] == 'created' + e = mock_site.get(reply['edition']['key']) + assert e.type.key == '/type/edition' + assert e.source_records == ['ia:test_item'] + + rec = { + 'ocaid': 'test_item', + 'source_records': ['ia:test_item'], + # Titles MUST match to be considered the same + 'title': 'Test item', + 'languages': ['fre'], + } + reply = load(rec) + assert reply['success'] is True + assert reply['edition']['status'] == 'matched' + +def test_from_marc_3(mock_site, add_languages): + ia = 'treatiseonhistor00dixo' + data = open_test_data(ia + '_meta.mrc').read() + assert len(data) == int(data[:5]) + rec = read_edition(MarcBinary(data)) + rec['source_records'] = ['ia:' + ia] + reply = load(rec) + assert reply['success'] is True + assert reply['edition']['status'] == 'created' + e = mock_site.get(reply['edition']['key']) + assert e.type.key == '/type/edition' + +def test_from_marc_2(mock_site, add_languages): + ia = 'roadstogreatness00gall' + data = open_test_data(ia + '_meta.mrc').read() + assert len(data) == int(data[:5]) + rec = read_edition(MarcBinary(data)) + rec['source_records'] = ['ia:' + ia] + reply = load(rec) + assert reply['success'] is True + assert reply['edition']['status'] == 'created' + e = mock_site.get(reply['edition']['key']) + assert e.type.key == '/type/edition' + reply = load(rec) + assert reply['success'] is True + assert reply['edition']['status'] == 'matched' + +def test_from_marc(mock_site, add_languages): + ia = 'flatlandromanceo00abbouoft' + data = open_test_data(ia + '_meta.mrc').read() + assert len(data) == int(data[:5]) + rec = read_edition(MarcBinary(data)) + reply = load(rec) + assert reply['success'] is True + akey1 = reply['authors'][0]['key'] + a = mock_site.get(akey1) + assert a.type.key == '/type/author' + assert a.name == 'Edwin Abbott Abbott' + assert a.birth_date == '1838' + assert a.death_date == '1926' + +def test_author_from_700(mock_site, add_languages): + ia = 'sexuallytransmit00egen' + data = open_test_data(ia + '_meta.mrc').read() + rec = read_edition(MarcBinary(data)) + rec['source_records'] = ['ia:' + ia] + reply = load(rec) + assert reply['success'] is True + # author from 700 + akey = 
reply['authors'][0]['key'] + a = mock_site.get(akey) + assert a.type.key == '/type/author' + assert a.name == 'Laura K. Egendorf' + assert a.birth_date == '1973' + +def test_from_marc_fields(mock_site, add_languages): + ia = 'isbn_9781419594069' + data = open_test_data(ia + '_meta.mrc').read() + rec = read_edition(MarcBinary(data)) + rec['source_records'] = ['ia:' + ia] + reply = load(rec) + assert reply['success'] is True + # author from 100 + assert reply['authors'][0]['name'] == 'Adam Weiner' + + edition = mock_site.get(reply['edition']['key']) + # Publish place, publisher, & publish date - 260$a, $b, $c + assert edition['publishers'][0] == 'Kaplan Publishing' + assert edition['publish_date'] == '2007' + assert edition['publish_places'][0] == 'New York' + # Pagination 300 + assert edition['number_of_pages'] == 264 + assert edition['pagination'] == 'viii, 264 p.' + # 8 subjects, 650 + assert len(edition['subjects']) == 8 + assert edition['subjects'] == [u'Action and adventure films', + u'Miscellanea', + u'Physics', + u'Cinematography', + u'Special effects', + u'Physics in motion pictures', + u'Science fiction films', + u'Popular works'] + # Edition description from 520 + desc = 'Explains the basic laws of physics, covering such topics as mechanics, forces, and energy, while deconstructing famous scenes and stunts from motion pictures, including "Apollo 13" and "Titanic," to determine if they are possible.' + assert isinstance(edition['description'], Text) + assert edition['description'] == desc + # Work description from 520 + work = mock_site.get(reply['work']['key']) + assert isinstance(work['description'], Text) + assert work['description'] == desc + +def test_build_pool(mock_site): + assert build_pool({'title': 'test'}) == {} + etype = '/type/edition' + ekey = mock_site.new_key(etype) + e = { + 'title': 'test', + 'type': {'key': etype}, + 'lccn': ['123'], + 'oclc_numbers': ['456'], + 'ocaid': 'test00test', + 'key': ekey, + } + + mock_site.save(e) + pool = build_pool(e) + assert pool == { + 'lccn': ['/books/OL1M'], + 'oclc_numbers': ['/books/OL1M'], + 'title': ['/books/OL1M'], + 'ocaid': ['/books/OL1M'] + } + + pool = build_pool({'lccn': ['234'], 'oclc_numbers': ['456'], 'title': 'test', 'ocaid': 'test00test'}) + assert pool == { 'oclc_numbers': ['/books/OL1M'], 'title': ['/books/OL1M'], 'ocaid': ['/books/OL1M'] } + +def test_try_merge(mock_site): + rec = { + 'title': 'Test item', + 'lccn': ['123'], + 'authors': [{'name': 'Smith, John', 'birth_date': '1980'}], + 'source_records': ['ia:test_item'], + } + reply = load(rec) + ekey = reply['edition']['key'] + e = mock_site.get(ekey) + + rec['full_title'] = rec['title'] + e1 = build_marc(rec) + add_db_name(e1) + result = try_merge(e1, ekey, e) + assert result is True + +def test_load_multiple(mock_site): + rec = { + 'title': 'Test item', + 'lccn': ['123'], + 'source_records': ['ia:test_item'], + 'authors': [{'name': 'Smith, John', 'birth_date': '1980'}], + } + reply = load(rec) + assert reply['success'] is True + ekey1 = reply['edition']['key'] + + reply = load(rec) + assert reply['success'] is True + ekey2 = reply['edition']['key'] + assert ekey1 == ekey2 + + reply = load({'title': 'Test item', 'source_records': ['ia:test_item2'], 'lccn': ['456']}) + assert reply['success'] is True + ekey3 = reply['edition']['key'] + assert ekey3 != ekey1 + + reply = load(rec) + assert reply['success'] is True + ekey4 = reply['edition']['key'] + + assert ekey1 == ekey2 == ekey4 + +def test_add_db_name(): + authors = [ + {'name': 'Smith, John' }, + {'name': 
'Smith, John', 'date': '1950' }, + { 'name': 'Smith, John', + 'birth_date': '1895', + 'death_date': '1964' }, + ] + orig = deepcopy(authors) + add_db_name({'authors': authors}) + orig[0]['db_name'] = orig[0]['name'] + orig[1]['db_name'] = orig[1]['name'] + ' 1950' + orig[2]['db_name'] = orig[2]['name'] + ' 1895-1964' + assert authors == orig + + rec = {} + add_db_name(rec) + assert rec == {} + +def test_from_marc(mock_site, add_languages): + ia = 'coursepuremath00hardrich' + marc = MarcBinary(open_test_data(ia + '_meta.mrc').read()) + rec = read_edition(marc) + rec['source_records'] = ['ia:' + ia] + reply = load(rec) + assert reply['success'] is True + assert reply['edition']['status'] == 'created' + reply = load(rec) + assert reply['success'] is True + assert reply['edition']['status'] == 'matched' + + ia = 'flatlandromanceo00abbouoft' + marc = MarcBinary(open_test_data(ia + '_meta.mrc').read()) + + rec = read_edition(marc) + rec['source_records'] = ['ia:' + ia] + reply = load(rec) + assert reply['success'] is True + assert reply['edition']['status'] == 'created' + reply = load(rec) + assert reply['success'] is True + assert reply['edition']['status'] == 'matched' + +def test_real_example(mock_site, add_languages): + src = 'v38.i37.records.utf8--16478504-1254' + marc = MarcBinary(open_test_data(src).read()) + rec = read_edition(marc) + rec['source_records'] = ['marc:' + src] + reply = load(rec) + assert reply['success'] is True + reply = load(rec) + assert reply['success'] is True + assert reply['edition']['status'] == 'matched' + + src = 'v39.i28.records.utf8--5362776-1764' + marc = MarcBinary(open_test_data(src).read()) + rec = read_edition(marc) + rec['source_records'] = ['marc:' + src] + reply = load(rec) + assert reply['success'] is True + assert reply['edition']['status'] == 'modified' + +def test_missing_ocaid(mock_site, add_languages, ia_writeback): + ia = 'descendantsofhug00cham' + src = ia + '_meta.mrc' + marc = MarcBinary(open_test_data(src).read()) + rec = read_edition(marc) + rec['source_records'] = ['marc:testdata.mrc'] + reply = load(rec) + assert reply['success'] is True + rec['source_records'] = ['ia:' + ia] + rec['ocaid'] = ia + reply = load(rec) + assert reply['success'] is True + e = mock_site.get(reply['edition']['key']) + assert e.ocaid == ia + assert 'ia:' + ia in e.source_records + +def test_extra_author(mock_site, add_languages): + mock_site.save({ + "name": "Hubert Howe Bancroft", + "death_date": "1918.", + "alternate_names": ["HUBERT HOWE BANCROFT", "Hubert Howe Bandcroft"], + "key": "/authors/OL563100A", + "birth_date": "1832", + "personal_name": "Hubert Howe Bancroft", + "type": {"key": "/type/author"}, + }) + + mock_site.save({ + "title": "The works of Hubert Howe Bancroft", + "covers": [6060295, 5551343], + "first_sentence": {"type": "/type/text", "value": "When it first became known to Europe that a new continent had been discovered, the wise men, philosophers, and especially the learned ecclesiastics, were sorely perplexed to account for such a discovery."}, + "subject_places": ["Alaska", "America", "Arizona", "British Columbia", "California", "Canadian Northwest", "Central America", "Colorado", "Idaho", "Mexico", "Montana", "Nevada", "New Mexico", "Northwest Coast of North America", "Northwest boundary of the United States", "Oregon", "Pacific States", "Texas", "United States", "Utah", "Washington (State)", "West (U.S.)", "Wyoming"], + "excerpts": [{"excerpt": "When it first became known to Europe that a new continent had been discovered, the wise men, 
philosophers, and especially the learned ecclesiastics, were sorely perplexed to account for such a discovery."}], + "first_publish_date": "1882", + "key": "/works/OL3421434W", + "authors": [{"type": {"key": "/type/author_role"}, "author": {"key": "/authors/OL563100A"}}], + "subject_times": ["1540-1810", "1810-1821", "1821-1861", "1821-1951", "1846-1850", "1850-1950", "1859-", "1859-1950", "1867-1910", "1867-1959", "1871-1903", "Civil War, 1861-1865", "Conquest, 1519-1540", "European intervention, 1861-1867", "Spanish colony, 1540-1810", "To 1519", "To 1821", "To 1846", "To 1859", "To 1867", "To 1871", "To 1889", "To 1912", "Wars of Independence, 1810-1821"], + "type": {"key": "/type/work"}, + "subjects": ["Antiquities", "Archaeology", "Autobiography", "Bibliography", "California Civil War, 1861-1865", "Comparative Literature", "Comparative civilization", "Courts", "Description and travel", "Discovery and exploration", "Early accounts to 1600", "English essays", "Ethnology", "Foreign relations", "Gold discoveries", "Historians", "History", "Indians", "Indians of Central America", "Indians of Mexico", "Indians of North America", "Languages", "Law", "Mayas", "Mexican War, 1846-1848", "Nahuas", "Nahuatl language", "Oregon question", "Political aspects of Law", "Politics and government", "Religion and mythology", "Religions", "Social life and customs", "Spanish", "Vigilance committees", "Writing", "Zamorano 80", "Accessible book", "Protected DAISY"] + }) + + ia = 'workshuberthowe00racegoog' + src = ia + '_meta.mrc' + marc = MarcBinary(open_test_data(src).read()) + rec = read_edition(marc) + rec['source_records'] = ['ia:' + ia] + + reply = load(rec) + assert reply['success'] is True + + w = mock_site.get(reply['work']['key']) + + reply = load(rec) + assert reply['success'] is True + w = mock_site.get(reply['work']['key']) + assert len(w['authors']) == 1 + +def test_missing_source_records(mock_site, add_languages): + mock_site.save({ + 'key': '/authors/OL592898A', + 'name': 'Michael Robert Marrus', + 'personal_name': 'Michael Robert Marrus', + 'type': { 'key': '/type/author' } + }) + + mock_site.save({ + 'authors': [{'author': '/authors/OL592898A', 'type': { 'key': '/type/author_role' }}], + 'key': '/works/OL16029710W', + 'subjects': ['Nuremberg Trial of Major German War Criminals, Nuremberg, Germany, 1945-1946', 'Protected DAISY', 'Lending library'], + 'title': 'The Nuremberg war crimes trial, 1945-46', + 'type': { 'key': '/type/work' }, + }) + + mock_site.save({ + "number_of_pages": 276, + "subtitle": "a documentary history", + "series": ["The Bedford series in history and culture"], + "covers": [6649715, 3865334, 173632], + "lc_classifications": ["D804.G42 N87 1997"], + "ocaid": "nurembergwarcrim00marr", + "contributions": ["Marrus, Michael Robert."], + "uri_descriptions": ["Book review (H-Net)"], + "title": "The Nuremberg war crimes trial, 1945-46", + "languages": [{"key": "/languages/eng"}], + "subjects": ["Nuremberg Trial of Major German War Criminals, Nuremberg, Germany, 1945-1946"], + "publish_country": "mau", "by_statement": "[compiled by] Michael R. Marrus.", + "type": {"key": "/type/edition"}, + "uris": ["http://www.h-net.org/review/hrev-a0a6c9-aa"], + "publishers": ["Bedford Books"], + "ia_box_id": ["IA127618"], + "key": "/books/OL1023483M", + "authors": [{"key": "/authors/OL592898A"}], + "publish_places": ["Boston"], + "pagination": "xi, 276 p. :", + "lccn": ["96086777"], + "notes": {"type": "/type/text", "value": "Includes bibliographical references (p. 
262-268) and index."}, + "identifiers": {"goodreads": ["326638"], "librarything": ["1114474"]}, + "url": ["http://www.h-net.org/review/hrev-a0a6c9-aa"], + "isbn_10": ["031216386X", "0312136919"], + "publish_date": "1997", + "works": [{"key": "/works/OL16029710W"}] + }) + + ia = 'nurembergwarcrim1997marr' + src = ia + '_meta.mrc' + marc = MarcBinary(open_test_data(src).read()) + rec = read_edition(marc) + rec['source_records'] = ['ia:' + ia] + + reply = load(rec) + assert reply['success'] is True + e = mock_site.get(reply['edition']['key']) + assert 'source_records' in e + +def test_no_extra_author(mock_site, add_languages): + author = { + "name": "Paul Michael Boothe", + "key": "/authors/OL1A", + "type": {"key": "/type/author"}, + } + mock_site.save(author) + + work = { + "title": "A Separate Pension Plan for Alberta", + "covers": [1644794], + "key": "/works/OL1W", + "authors": [{"type": "/type/author_role", "author": {"key": "/authors/OL1A"}}], + "type": {"key": "/type/work"}, + } + mock_site.save(work) + + edition = { + "number_of_pages": 90, + "subtitle": "Analysis and Discussion (Western Studies in Economic Policy, No. 5)", + "weight": "6.2 ounces", + "covers": [1644794], + "latest_revision": 6, + "title": "A Separate Pension Plan for Alberta", + "languages": [{"key": "/languages/eng"}], + "subjects": ["Economics", "Alberta", "Political Science / State & Local Government", "Government policy", "Old age pensions", "Pensions", "Social security"], + "type": {"key": "/type/edition"}, + "physical_dimensions": "9 x 6 x 0.2 inches", + "publishers": ["The University of Alberta Press"], + "physical_format": "Paperback", + "key": "/books/OL1M", + "authors": [{"key": "/authors/OL1A"}], + "identifiers": {"goodreads": ["4340973"], "librarything": ["5580522"]}, + "isbn_13": ["9780888643513"], + "isbn_10": ["0888643519"], + "publish_date": "May 1, 2000", + "works": [{"key": "/works/OL1W"}] + } + mock_site.save(edition) + + src = 'v39.i34.records.utf8--186503-1413' + marc = MarcBinary(open_test_data(src).read()) + rec = read_edition(marc) + rec['source_records'] = ['marc:' + src] + + reply = load(rec) + assert reply['success'] is True + assert reply['edition']['status'] == 'modified' + assert reply['work']['status'] == 'modified' + assert 'authors' not in reply + + assert reply['edition']['key'] == edition['key'] + assert reply['work']['key'] == work['key'] + + e = mock_site.get(reply['edition']['key']) + w = mock_site.get(reply['work']['key']) + + assert 'source_records' in e + assert 'subjects' in w + assert len(e['authors']) == 1 + assert len(w['authors']) == 1 + +def test_don_quixote(mock_site): + """ + All of these items are by 'Miguel de Cervantes Saavedra', + only one Author should be created. Some items have bad + MARC length, others are missing binary MARC altogether + and raise BadMARC exceptions. 
+ """ + pytest.skip("This test make live requests to archive.org") + + dq = [u'lifeexploitsofin01cerv', u'cu31924096224518', + u'elingeniosedcrit04cerv', u'ingeniousgentlem01cervuoft', + u'historyofingenio01cerv', u'lifeexploitsofin02cerviala', + u'elingeniosohidal03cervuoft', u'nybc209000', u'elingeniosohidal11cerv', + u'elingeniosohidal01cervuoft', u'elingeniosoh01cerv', + u'donquixotedelama00cerviala', u'1896elingeniosohid02cerv', + u'ingeniousgentlem04cervuoft', u'cu31924027656978', u'histoiredeladmir01cerv', + u'donquijotedelama04cerv', u'cu31924027657075', u'donquixotedelama03cervuoft', + u'aventurasdedonqu00cerv', u'p1elingeniosohid03cerv', + u'geshikhefundonik01cervuoft', u'historyofvalorou02cerviala', + u'ingeniousgentlem01cerv', u'donquixotedelama01cervuoft', + u'ingeniousgentlem0195cerv', u'firstpartofdelig00cervuoft', + u'p4elingeniosohid02cerv', u'donquijote00cervuoft', u'cu31924008863924', + u'c2elingeniosohid02cerv', u'historyofvalorou03cerviala', + u'historyofingenio01cerviala', u'historyadventure00cerv', + u'elingeniosohidal00cerv', u'lifeexploitsofin01cervuoft', + u'p2elingeniosohid05cerv', u'nybc203136', u'elingeniosohidal00cervuoft', + u'donquixotedelama02cervuoft', u'lingnieuxcheva00cerv', + u'ingeniousgentlem03cerv', u'vidayhechosdeli00siscgoog', + u'lifeandexploits01jarvgoog', u'elingeniosohida00puiggoog', + u'elingeniosohida00navagoog', u'donquichottedel02florgoog', + u'historydonquixo00cogoog', u'vidayhechosdeli01siscgoog', + u'elingeniosohida28saavgoog', u'historyvalorous00brangoog', + u'elingeniosohida01goog', u'historyandadven00unkngoog', + u'historyvalorous01goog', u'ingeniousgentle11saavgoog', + u'elingeniosohida10saavgoog', u'adventuresdonqu00jarvgoog', + u'historydonquixo04saavgoog', u'lingnieuxcheval00rouxgoog', + u'elingeniosohida19saavgoog', u'historyingeniou00lalagoog', + u'elingeniosohida00ormsgoog', u'historyandadven01smolgoog', + u'elingeniosohida27saavgoog', u'elingeniosohida21saavgoog', + u'historyingeniou00mottgoog', u'historyingeniou03unkngoog', + u'lifeandexploits00jarvgoog', u'ingeniousgentle00conggoog', + u'elingeniosohida00quixgoog', u'elingeniosohida01saavgoog', + u'donquixotedelam02saavgoog', u'adventuresdonqu00gilbgoog', + u'historyingeniou02saavgoog', u'donquixotedelam03saavgoog', + u'elingeniosohida00ochogoog', u'historyingeniou08mottgoog', + u'lifeandexploits01saavgoog', u'firstpartdeligh00shelgoog', + u'elingeniosohida00castgoog', u'elingeniosohida01castgoog', + u'adventofdonquixo00cerv', u'portablecervante00cerv', + u'firstpartofdelig14cerv', u'donquixotemanofl00cerv', + u'firstpartofdelig00cerv'] + + bad_length = [] + bad_marc = [] + + add_languages(mock_site) + edition_status_counts = defaultdict(int) + work_status_counts = defaultdict(int) + author_status_counts = defaultdict(int) + + for ocaid in dq: + marc_url = 'https://archive.org/download/%s/%s_meta.mrc' % (ocaid, ocaid) + data = urlopen(marc_url).read() + try: + marc = MarcBinary(data) + except BadLength: + bad_length.append(ocaid) + continue + except BadMARC: + bad_marc.append(ocaid) + continue + + rec = read_edition(marc) + rec['source_records'] = ['ia:' + ocaid] + reply = load(rec) + + q = { + 'type': '/type/work', + 'authors.author': '/authors/OL1A', + } + work_keys = list(mock_site.things(q)) + author_keys = list(mock_site.things({'type': '/type/author'})) + print("\nReply for %s: %s" % (ocaid, reply)) + print("Work keys: %s" % work_keys) + assert author_keys == ['/authors/OL1A'] + assert reply['success'] is True + + # Increment status counters + 
edition_status_counts[reply['edition']['status']] += 1 + work_status_counts[reply['work']['status']] += 1 + if (reply['work']['status'] != 'matched') and (reply['edition']['status'] != 'modified'): + # No author key in response if work is 'matched' + # No author key in response if edition is 'modified' + author_status_counts[reply['authors'][0]['status']] += 1 + + print("BAD MARC LENGTH items: %s" % bad_length) + print("BAD MARC items: %s" % bad_marc) + print("Edition status counts: %s" % edition_status_counts) + print("Work status counts: %s" % work_status_counts) + print("Author status counts: %s" % author_status_counts) + + +def test_same_twice(mock_site, add_languages): + rec = { + 'source_records': ['ia:test_item'], + "publishers": ["Ten Speed Press"], "pagination": "20 p.", "description": "A macabre mash-up of the children's classic Pat the Bunny and the present-day zombie phenomenon, with the tactile features of the original book revoltingly re-imagined for an adult audience.", "title": "Pat The Zombie", "isbn_13": ["9781607740360"], "languages": ["eng"], "isbn_10": ["1607740362"], "authors": [{"entity_type": "person", "name": "Aaron Ximm", "personal_name": "Aaron Ximm"}], "contributions": ["Kaveh Soofi (Illustrator)"]} + reply = load(rec) + assert reply['success'] is True + assert reply['edition']['status'] == 'created' + assert reply['work']['status'] == 'created' + + reply = load(rec) + assert reply['success'] is True + assert reply['edition']['status'] == 'matched' + assert reply['work']['status'] == 'matched' + + +def test_existing_work(mock_site, add_languages): + author = { + 'type': {'key': '/type/author'}, + 'name': 'John Smith', + 'key': '/authors/OL20A'} + existing_work = { + 'authors': [{'author': '/authors/OL20A', 'type': {'key': '/type/author_role'}}], + 'key': '/works/OL16W', + 'title': 'Finding existing works', + 'type': {'key': '/type/work'}, + } + mock_site.save(author) + mock_site.save(existing_work) + rec = { + 'source_records': 'non-marc:test', + 'title': 'Finding Existing Works', + 'authors': [{'name': 'John Smith'}], + 'publishers': ['Black Spot'], + 'publish_date': 'Jan 09, 2011', + 'isbn_10': ['1250144051'], + } + + reply = load(rec) + assert reply['success'] is True + assert reply['edition']['status'] == 'created' + assert reply['work']['status'] == 'matched' + assert reply['work']['key'] == '/works/OL16W' + assert reply['authors'][0]['status'] == 'matched' + e = mock_site.get(reply['edition']['key']) + assert e.works[0]['key'] == '/works/OL16W' + + +def test_existing_work_with_subtitle(mock_site, add_languages): + author = { + 'type': {'key': '/type/author'}, + 'name': 'John Smith', + 'key': '/authors/OL20A'} + existing_work = { + 'authors': [{'author': '/authors/OL20A', 'type': {'key': '/type/author_role'}}], + 'key': '/works/OL16W', + 'title': 'Finding existing works', + 'type': {'key': '/type/work'}, + } + mock_site.save(author) + mock_site.save(existing_work) + rec = { + 'source_records': 'non-marc:test', + 'title': 'Finding Existing Works', + 'subtitle': 'the ongoing saga!', + 'authors': [{'name': 'John Smith'}], + 'publishers': ['Black Spot'], + 'publish_date': 'Jan 09, 2011', + 'isbn_10': ['1250144051'], + } + + reply = load(rec) + assert reply['success'] is True + assert reply['edition']['status'] == 'created' + assert reply['work']['status'] == 'matched' + assert reply['work']['key'] == '/works/OL16W' + assert reply['authors'][0]['status'] == 'matched' + e = mock_site.get(reply['edition']['key']) + assert e.works[0]['key'] == '/works/OL16W' diff 
--git a/ia-legacy-importer/add_book/test_merge.py b/ia-legacy-importer/add_book/test_merge.py new file mode 100644 index 00000000..781031a4 --- /dev/null +++ b/ia-legacy-importer/add_book/test_merge.py @@ -0,0 +1,47 @@ +import pytest +import web + +from openlibrary.catalog.add_book.merge import try_merge +from openlibrary.core.models import Edition +from openlibrary.mocks.mock_infobase import MockSite + +@pytest.mark.skip("This should be tested, but tidy up deprecated methods first.") +def test_try_merge(): + web.ctx.site = MockSite() + bpl = {'authors': [{'birth_date': u'1897', + 'db_name': u'Green, Constance McLaughlin 1897-', + 'entity_type': 'person', + 'name': u'Green, Constance McLaughlin', + 'personal_name': u'Green, Constance McLaughlin'}], + 'full_title': u'Eli Whitney and the birth of American technology', + 'isbn': [u'188674632X'], + 'normalized_title': u'eli whitney and the birth of american technology', + 'number_of_pages': 215, + 'publish_date': '1956', + 'publishers': [u'HarperCollins', u'[distributed by Talman Pub.]'], + 'short_title': u'eli whitney and the birth', + 'source_record_loc': 'bpl101.mrc:0:1226', + 'titles': [u'Eli Whitney and the birth of American technology', + u'eli whitney and the birth of american technology']} + # This existing needs to be an Edition Thing object. + existing = {'authors': [{'birth_date': u'1897', + 'db_name': u'Green, Constance McLaughlin 1897-', + 'entity_type': 'person', + 'name': u'Green, Constance McLaughlin', + 'personal_name': u'Green, Constance McLaughlin'}], + 'full_title': u'Eli Whitney and the birth of American technology.', + 'isbn': [], + 'normalized_title': u'eli whitney and the birth of american technology', + 'number_of_pages': 215, + 'publish_date': '1956', + 'publishers': ['Little, Brown'], + 'short_title': u'eli whitney and the birth', + 'source_record_loc': 'marc_records_scriblio_net/part04.dat:119539872:591', + 'title': 'Eli Whitney and the birth of American technology.', + 'type': {'key': '/type/edition'}, + 'key': '/books/OL1M'} + + web.ctx.site.save_many([existing]) + ed = web.ctx.site.get('/books/OL1M') + assert try_merge(bpl, '/books/OL1M', ed) is True + diff --git a/ia-legacy-importer/amazon/__init__.py b/ia-legacy-importer/amazon/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/ia-legacy-importer/amazon/add_covers.py b/ia-legacy-importer/amazon/add_covers.py new file mode 100644 index 00000000..545b3098 --- /dev/null +++ b/ia-legacy-importer/amazon/add_covers.py @@ -0,0 +1,37 @@ +from __future__ import print_function +import simplejson + +from six.moves.urllib.request import urlopen + + +base = 'http://ia331526.us.archive.org:7001/openlibrary.org/log/' + +out = open('edition_and_isbn', 'w') +offset = '2009-06-01:0' +while not offset.startswith('2010-03-17:'): + url = base + offset + ret = simplejson.load(urlopen(url)) + offset, data = ret['offset'], ret['data'] + print(offset, len(data)) + for i in data: + action = i.pop('action') + key = i['data'].pop('key', None) + if action == 'new_account': + continue + author = i['data'].get('author', None) if 'data' in i else None + if author != '/user/ImportBot': + continue + assert action in ('save_many', 'save') + if action == 'save' and key.startswith('/b/'): + e = i['data']['query'] + if e: + isbn = e.get('isbn_10', None) + if isbn: + print((key, isbn), file=out) + elif action == 'save_many': + for e in i['data']['query']: + if e['type'] == '/type/edition' and e['key'].startswith('/b/'): + isbn = e.get('isbn_10', None) + if isbn: + 
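+ # bulk saves: write the key and isbn_10 of every edition touched by ImportBot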
print((e['key'], isbn), file=out) +out.close() diff --git a/ia-legacy-importer/amazon/amazon_to_arc.py b/ia-legacy-importer/amazon/amazon_to_arc.py new file mode 100644 index 00000000..ff88980a --- /dev/null +++ b/ia-legacy-importer/amazon/amazon_to_arc.py @@ -0,0 +1,43 @@ +from __future__ import print_function +import socket + +#url = "http://www.amazon.com/dp/1847195881" +#asin = "1847195881" + +def get(sock, host, url): + send = 'GET %s HTTP/1.1\r\nHost: %s\r\nAccept-Encoding: identity\r\n\r\n' % (url, host) + sock.sendall(send) + + fp = sock.makefile('rb', 0) + + line = fp.readline() + print('status:', repr(line)) + + state = 'header' + for line in fp: + if line == '\r\n': + break + print('header', repr(line)) + + while True: + chunk_size = int(fp.readline(),16) + print(chunk_size) + if chunk_size == 0: + break + print(len(fp.read(chunk_size))) + print(repr(fp.read(2))) + line = fp.readline() + print(line) + fp.close() + +host = 'openlibrary.org' +host = 'www.amazon.com' +sock = socket.create_connection((host, 80)) + +url = 'http://openlibrary.org/type/work' +url = "http://www.amazon.com/dp/1847195881" +get(sock, host, url) + +url = 'http://openlibrary.org/type/edition' +url = "http://www.amazon.com/dp/0393062287" +get(sock, host, url) diff --git a/ia-legacy-importer/amazon/arc_index.py b/ia-legacy-importer/amazon/arc_index.py new file mode 100644 index 00000000..898ed803 --- /dev/null +++ b/ia-legacy-importer/amazon/arc_index.py @@ -0,0 +1,23 @@ +from __future__ import print_function +import os + +arc_dir = '/2/edward/amazon/arc' + +def read_arc(filename): + f = open(arc_dir + '/' + filename) + idx = open(arc_dir + '/' + filename + '.idx', 'w') + while True: + pos = f.tell() + line = f.readline() + if line == '': + break + print(pos, file=idx) + size = int(line[:-1].split(' ')[4]) + f.read(size) + line = f.readline() + f.close() + idx.close() + +for filename in (i for i in os.listdir(arc_dir) if i.endswith('.arc')): + print(filename) + read_arc(filename) diff --git a/ia-legacy-importer/amazon/arc_view.py b/ia-legacy-importer/amazon/arc_view.py new file mode 100644 index 00000000..b277ba46 --- /dev/null +++ b/ia-legacy-importer/amazon/arc_view.py @@ -0,0 +1,65 @@ +import web +import os +from six import StringIO + +arc_dir = '/2/edward/amazon/arc' +urls = ( + '/', 'index', + '/(\d+\.arc)', 'arc_view', + '/(\d+\.arc)/(\d+)', 'page_view', +) +app = web.application(urls, globals(), autoreload=True) + +class arc_view: + def GET(self, filename): + ret = '' + ret += 'back to index
<br>' + ret += '<h2>%s</h2>' % filename + idx = open(arc_dir + '/' + filename + '.idx') + arc = open(arc_dir + '/' + filename) + for pos in idx: + arc.seek(int(pos)) + line = arc.readline()[:-1].split(' ') + ret += '<a href="/%s/%d">from ARC</a> OR <a href="%s">original</a> %s<br>
' % (filename, int(pos), line[0], line[0]) + idx.close() + + ret += '' + return ret + +class page_view: + def GET(self, filename, offset): + arc = open(arc_dir + '/' + filename) + arc.seek(int(offset)) + size = int(arc.readline().split(' ')[4]) + f = StringIO(arc.read(size)) + f.readline() + ret = '' + while True: + line=f.readline() + if line == '\r\n': + break + while True: + line = f.readline() + chunk_size = int(line, 16) + if chunk_size == 0: + break + buf = f.read(chunk_size) + ret += buf + f.readline() + return ret + +class index: + def GET(self): + ret = '
    ' + for filename in os.listdir(arc_dir): + if not filename.endswith('.arc'): + continue + f = open(arc_dir + '/' + filename) + line = f.readline() + f.close() + ret += '
  • %s - %s' % (filename, filename, line) + ret += '' + return ret + +if __name__ == "__main__": + app.run() diff --git a/ia-legacy-importer/amazon/crawl.py b/ia-legacy-importer/amazon/crawl.py new file mode 100644 index 00000000..a9027f1b --- /dev/null +++ b/ia-legacy-importer/amazon/crawl.py @@ -0,0 +1,291 @@ +from __future__ import print_function +from lxml.html import parse, tostring, fromstring +import re +import sys +import os +import socket +from time import sleep +from os.path import exists +from datetime import date, timedelta, datetime +import codecs + +from six.moves.urllib.parse import unquote +from six.moves.urllib.request import urlopen + + +# scrap Amazon for book and author data + +re_expect_end = re.compile('\n\n[ \n]*$') + +# publisher = Big Idea Books & Just Me Music +re_personalized = re.compile('Personalized for (.*) \((Boy|Girl)\)', re.I) + +def percent(a, b): + return float(a * 100.0) / b + +class PersonalizedBooks(Exception): + pass + +page_size = 12 +max_pages = 100 +max_results = page_size * max_pages + +# http://www.amazon.com/s/qid=1265761735/ref=sr_nr_n_0/177-5112913-4864616?ie=UTF8&rs=1000&bbn=1000&rnid=1000&rh=i%3Astripbooks%2Cp_n%5Ffeature%5Fbrowse-bin%3A618083011%2Cp%5Fn%5Fdate%3A20090101%2Cn%3A%211000%2Cn%3A1 +re_product_title = re.compile('/dp/([^/]*)') +re_result_count = re.compile('Showing (?:[\d,]+ - [\d,]+ of )?([\d,]+) Result') +#re_rh_n = re.compile('rh=n%3A(\d+)%2C') +re_rh_n = re.compile('%2Cn%3A(\d+)') +re_facet_count = re.compile(u'^\xa0\(([\d,]+)\)$') +u'\xa0(8)' + +base_url = "http://www.amazon.com/s?ie=UTF8&rh=" +rh = 'i:stripbooks,p_n_feature_browse-bin:618083011,p_n_date:' + +out_dir = '/0/amazon' +arc_dir = '/0/amazon/arc' + +# 4 = Children's Books, 28 = Teens +re_child_book_param = re.compile(',n:(4|28)(?:&page=\d+)?$') + +def now(): + return datetime.utcnow().replace(microsecond=0) + +max_size = 1024 * 1024 * 1024 * 10 # 10 GB +ip = '207.241.229.141' +content_type_hdr = 'Content-Type: ' +re_charset_header = re.compile('; charset=(.+)\r\n') +version_block = '1 0 Open Library\nURL IP-address Archive-date Content-type Archive-length\n' + +class Scraper: + def __init__(self, recording=True): + self.host = 'www.amazon.com' + self.sock = socket.create_connection((self.host, 80)) + self.recording = recording + self.cur_arc = None + + def add_to_arc(self, url, start, content_type, reply): + d = start.strftime('%Y%m%d%H%M%S') + if self.cur_arc is None or os.stat(arc_dir + self.cur_arc).st_size > max_size: + self.cur_arc = now().strftime('%Y%m%d%H%M%S') + '.arc' + assert not exists(arc_dir + self.cur_arc) + out = open(arc_dir + self.cur_arc, 'w') + out.write(' '.join(['filespec://' + self.cur_arc, ip, d, 'text/plain', str(len(version_block))]) + '\n') + out.write(version_block) + else: + out = open(arc_dir + self.cur_arc, 'a') + out.write('\n' + ' '.join([url, ip, d, content_type, str(len(reply))]) + '\n') + out.write(reply) + out.close() + + def get(self, url): + start = now() + send = 'GET %s HTTP/1.1\r\nHost: %s\r\nUser-Agent: Mozilla/5.0\r\nAccept-Encoding: identity\r\n\r\n' % (url, self.host) + self.sock.sendall(send) + + fp = self.sock.makefile('rb', 0) + recv_buf = '' + + line = fp.readline() + if not line.startswith('HTTP/1.1 200'): + print('status:', repr(line)) + recv_buf += line + + body = '' + content_type = None + charset = None + for line in fp: # read headers + recv_buf += line + if line.lower().startswith('transfer-encoding'): + assert line == 'Transfer-Encoding: chunked\r\n' + if line == '\r\n': + break + if 
line.lower().startswith('content-type'): + assert line.startswith(content_type_hdr) + assert line[-2:] == '\r\n' + content_type = line[len(content_type_hdr):line.find(';') if ';' in line else -2] + if 'charset' in line.lower(): + m = re_charset_header.search(line) + charset = m.group(1) + + while True: + line = fp.readline() + recv_buf += line + chunk_size = int(line, 16) + if chunk_size == 0: + break + chunk = fp.read(chunk_size) + recv_buf += chunk + body += chunk + assert chunk_size == len(chunk) + recv_buf += fp.read(2) + line = fp.readline() + recv_buf += line + fp.close() + if self.recording: + self.add_to_arc(url, start, content_type, recv_buf) + return body.decode(charset) if charset else body + +scraper = Scraper(recording=True) + +def get_url(params): + url = base_url + params + page = scraper.get(url) + return fromstring(page) + +def get_total(root): + if root.find(".//h1[@id='noResultsTitle']") is not None: + return 0 + result_count = root.find(".//td[@class='resultCount']").text + m = re_result_count.match(result_count) + return int(m.group(1).replace(',', '')) + +def read_books(params, root): + # sometimes there is no link, bug at Amazaon + # either skip it, or reload the page + for i in range(5): + book_links = [e.find('.//a[@href]') for e in root.find_class('dataColumn')] + if all(a is not None for a in book_links): + break + sleep(2) + print('retry:', params) + root = get_url(params) + if re_child_book_param.search(params) and all(re_personalized.search(span.text) for span in root.find_class('srTitle')): + raise PersonalizedBooks + return [re_product_title.search(a.attrib['href']).group(1) for a in book_links if a is not None and a.text] + +def get_cats(root): + cats = [] + for div in root.find_class('narrowItemHeading'): + if div.text != 'Department': + continue + container = div.getparent() + assert container.tag == 'td' and container.attrib['class'] == 'refinementContainer' + break + + table = container.find('table') + for e in table.iterfind(".//div[@class='refinement']"): + a = e[0] + assert a.tag == 'a' + span1 = a[0] + assert span1.tag == 'span' and span1.attrib['class'] == 'refinementLink' + span2 = a[1] + assert span2.tag == 'span' and span2.attrib['class'] == 'narrowValue' + href = a.attrib['href'] + m1 = re_rh_n.search(href) + if not m1: + print('no match:') + print(repr(href)) + m2 = re_facet_count.search(span2.text) + cats.append((int(m1.group(1)), span1.text, int(m2.group(1).replace(',','')))) + + return cats + + for e in container.find('table').find_class('refinementLink'): + a = e.getparent() + assert a.tag == 'a' + cat = { 'url': a.attrib['href'], 'title': e.text } + href = a.attrib['href'] + m = re_rh_n.search(href) + cats.append((int(m.group(1)), e.text)) + +def read_page(params): + # read search results page + root = get_url(params) + total = get_total(root) + if total == 0: + print('no results found') + return total, set(), [] + grand_total = total + pages = (total / page_size) + 1 + print('total:', total, 'pages:', pages) + + cats = get_cats(root) + print('cats 1') + for a, b, c in cats: + print("%8d %-30s %8d" % (a, b, c)) + #return grand_total, [], cats + + books = set() + + books.update(read_books(params, root)) + for page in range(2, min((pages, 100))+1): + params_with_page = params + "&page=%d" % page + books.update(read_books(params_with_page, get_url(params_with_page))) + print(page, len(books)) + + print(len(books)) + + cats = get_cats(root) + print('cats 2') + for a, b, c in cats: + print("%8d %30s %8d" % (a, b, c)) + print('cat total:', 
sum(i[2] for i in cats)) + if total > max_results: + for n, title, count in cats: + print(repr(n, title, count)) + params_with_cat = params + ",n:" + str(n) + root = get_url(params_with_cat) + cat_total = get_total(root) + pages = (cat_total / page_size) + 1 + print('cat_total:', total, 'pages:', total / page_size) + if cat_total > max_results: + print('cat_total (%d) > max results (%d)' % (total, max_results)) + # assert cat_total <= max_results + try: + books.update(read_books(params_with_cat, root)) + except PersonalizedBooks: + print('WARNING: Personalized Books') + continue + for page in range(2, min((pages, 100)) + 1): + params_with_page = params_with_cat + "&page=%d" % page + try: + books.update(read_books(params_with_page, get_url(params_with_page))) + except PersonalizedBooks: + print('WARNING: Personalized Books') + break + print(repr(n, title, page, cat_total / page_size, len(books), "%.1f%%" % percent(len(books), grand_total))) + + return total, books, cats + +def write_books(books): + i = 0 + error_count = 0 + + for asin in books: + i+= 1 + for attempt in range(5): + try: + #page = urlopen('http://amazon.com/dp/' + asin).read() + page = scraper.get('http://www.amazon.com/dp/' + asin) + if re_expect_end.search(page): + break + print('bad page ending') + print(repr(page[-60:])) + error_count += 1 + if error_count == 50: + print('too many bad endings') + print('http://amazon.com/dp/' + asin) + sys.exit(0) + except: + pass + print('retry') + sleep(5) + +if __name__ == '__main__': + + one_day = timedelta(days=1) + cur = date(2009, 1, 1) # start date + cur = date(2009, 11, 11) # start date + #cur = date(2009, 12, 25) + while True: + print(cur) + total, books, cats = read_page(rh + cur.strftime("%Y%m%d")) + open(out_dir + '/total.' + str(cur), 'w').write(str(total) + "\n") + + out = open(out_dir + "/cats." 
+ str(cur), 'w') + for i in cats: + print(i, file=out) + out.close() + print(len(books)) + write_books(books) + cur += one_day diff --git a/ia-legacy-importer/amazon/crawl_top_books.py b/ia-legacy-importer/amazon/crawl_top_books.py new file mode 100644 index 00000000..fe5b1528 --- /dev/null +++ b/ia-legacy-importer/amazon/crawl_top_books.py @@ -0,0 +1,22 @@ +from __future__ import print_function +from openlibrary.catalog.amazon.crawl import read_page, write_books, get_url, get_cats + +def get_serp(): + params = 'i:stripbooks,n:!1000,p_n_feature_browse-bin:618083011' + + #crawled = set(i[:-1] for i in open('/2/edward/amazon/crawled')) + + total, books, cats = read_page(params) + print('total:', total, 'number of books:', len(books), 'number of cats:', len(cats)) + +#get_serp() + +params = 'i:stripbooks,n:9988' +root = get_url(params) +cats = get_cats(root) + +for a, b, c in cats: + print("%8d %-30s %8d" % (a, b, c)) + +#books = [i[:-1] for i in open('/2/edward/amazon/best_sellers2')] +#write_books(books) diff --git a/ia-legacy-importer/amazon/extract_amazon_fields.py b/ia-legacy-importer/amazon/extract_amazon_fields.py new file mode 100644 index 00000000..0cdee052 --- /dev/null +++ b/ia-legacy-importer/amazon/extract_amazon_fields.py @@ -0,0 +1,34 @@ +# find fields in amazon data that don't appear in MARC data, extract and store in shelve + +import shelve + +seg_file = '/home/edward/ol/amazon/seg/22' + +match = set(eval(line)[0] \ + for line \ + in open('/home/edward/ol/merge/amazon_marc/amazon_lc_map')) + +# fields that MARC is missing: +# binding +# subject +# category +# series +# series_num +# edition +# dimensions +# first_sentence +# sip [] +# cap [] +# shipping_weight + +fields = [ 'binding', 'subject', 'category', 'series', 'series_num', 'edition',\ + 'dimensions', 'first_sentence', 'sip', 'cap', 'shipping_weight' ] + +d = shelve.open('amazon_fields.shelve', protocol=-1, writeback=True) + +for line in open(seg_file): + isbn, item = eval(line) + if isbn not in match: + continue + d[isbn] = dict([(f, item[f]) for f in fields if f in item]) +d.close diff --git a/ia-legacy-importer/amazon/get_other_editions.py b/ia-legacy-importer/amazon/get_other_editions.py new file mode 100644 index 00000000..bc7e1161 --- /dev/null +++ b/ia-legacy-importer/amazon/get_other_editions.py @@ -0,0 +1,38 @@ +from __future__ import print_function +from catalog.read_rc import read_rc +import web +import sys +import os.path +from time import time + +from six.moves import urllib + + +rc = read_rc() +web.config.db_parameters = dict(dbn='postgres', db=rc['db'], user=rc['user'], pw=rc['pw'], host=rc['host']) +web.config.db_printing = False +web.load() +dir = sys.argv[1] + +chunk = 10 +t0 = time() +isbn_iter = web.query('select value from edition_str where key_id=30') +for i, row in enumerate(isbn_iter): + isbn = row.value + dest = dir + '/' + isbn + if os.path.exists(dest): + continue + if len(isbn) != 10: + continue + url = 'http://www.amazon.com/dp/other-editions/' + isbn + try: + page = urllib.request.urlopen(url).read() + except urllib.error.HTTPError as error: + if error.code != 404: + raise + page = '' + open(dest, 'w').write(page) + if i % chunk == 0: + t1 = time() - t0 + rec_per_sec = float(i) / float(t1) + print("%s %s %.2f rec/sec" % (url, isbn, rec_per_sec)) diff --git a/ia-legacy-importer/amazon/import.py b/ia-legacy-importer/amazon/import.py new file mode 100644 index 00000000..a8586f0c --- /dev/null +++ b/ia-legacy-importer/amazon/import.py @@ -0,0 +1,207 @@ +from __future__ import print_function 
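+# Match scraped Amazon editions against existing Open Library records, following redirects and merging where possible.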
+import sys +import re +import os +from parse import read_edition +from lxml.html import fromstring +import catalog.importer.pool as pool +from catalog.importer.db_read import get_mc, withKey +import catalog.merge.amazon as amazon_merge +from catalog.get_ia import get_from_local, get_ia +from catalog.merge.merge_marc import build_marc +import catalog.marc.fast_parse as fast_parse + +import six +from six.moves import urllib + + +re_amazon = re.compile('^([A-Z0-9]{10}),(\d+):(.*)$', re.S) + +re_normalize = re.compile('[^\w ]') +re_whitespace = re.compile('\s+') +re_title_parens = re.compile('^(.+) \([^)]+?\)$') + +re_meta_marc = re.compile('([^/]+)_(meta|marc)\.(mrc|xml)') +# marc:marc_ithaca_college/ic_marc.mrc:224977427:1064 + +threshold = 875 + +def normalize_str(s): + s = re_normalize.sub('', s.strip()) + s = re_whitespace.sub(' ', s) + return str(s.lower()) + +# isbn, short title +def build_index_fields(asin, edition): + title = edition['title'] + if 'subtitle' in edition: + title += ' ' + edition['subtitle'] + + def norm(s): + return normalize_str(s)[:25].rstrip() + + titles = set([norm(title)]) + m = re_title_parens.match(title) + if m: + titles.add(norm(m.group(1))) + + isbn = set([asin]) + for field in 'asin', 'isbn_10', 'isbn_13': + if field in edition: + isbn.add(edition[field].replace('-', '')) + return {'title': list(titles), 'isbn': list(isbn)} + +def read_amazon_file(f): + while True: + buf = f.read(1024) + if not buf: + break + m = re_amazon.match(buf) + (asin, page_len, page) = m.groups() + page += f.read(int(page_len) - len(page)) + try: + edition = read_edition(fromstring(page)) + except: + print('bad record:', asin) + raise + if not edition: + continue + yield asin, edition + +def follow_redirects(key): + keys = [] + thing = None + while not thing or thing['type']['key'] == '/type/redirect': + keys.append(key) + thing = withKey(key) + assert thing + if thing['type']['key'] == '/type/redirect': + print('following redirect %s => %s' % (key, thing['location'])) + key = thing['location'] + return (keys, thing) + +def ia_match(a, ia): + try: + loc, rec = get_ia(ia) + except urllib.error.HTTPError: + return False + if rec is None or 'full_title' not in rec: + return False + try: + e1 = build_marc(rec) + except TypeError: + print(rec) + raise + return amazon_merge.attempt_merge(a, e1, threshold, debug=False) + +def marc_match(a, loc): + assert loc + rec = fast_parse.read_edition(get_from_local(loc)) + e1 = build_marc(rec) + #print 'amazon:', a + return amazon_merge.attempt_merge(a, e1, threshold, debug=False) + +def source_records_match(a, thing): + marc = 'marc:' + amazon = 'amazon:' + ia = 'ia:' + match = False + for src in thing['source_records']: + if not src.startswith('marc:marc_ithaca_college/ic'): + m = re_meta_marc.search(src) + if m: + src = 'ia:' + m.group(1) + if src.startswith(marc): + if marc_match(a, src[len(marc):]): + match = True + break + elif src.startswith(ia): + if src == 'ia:ic': + print(thing['source_records']) + if ia_match(a, src[len(ia):]): + match = True + break + else: + assert src.startswith(amazon) + continue + return match + + +def try_merge(edition, ekey, thing): + thing_type = thing['type']['key'] + if 'isbn_10' not in edition: + print(edition) + asin = edition.get('isbn_10', None) or edition['asin'] + if 'authors' in edition: + authors = [i['name'] for i in edition['authors']] + else: + authors = [] + a = amazon_merge.build_amazon(edition, authors) + assert isinstance(asin, six.string_types) + assert thing_type == '/type/edition' + #print 
edition['asin'], ekey + if 'source_records' in thing: + if 'amazon:' + asin in thing['source_records']: + return True + return source_records_match(a, thing) + + #print 'no source records' + mc = get_mc(ekey) + #print 'mc:', mc + if mc == 'amazon:' + asin: + return True + if not mc: + return False + data = get_from_local(mc) + e1 = build_marc(fast_parse.read_edition(data)) + return amazon_merge.attempt_merge(a, e1, threshold, debug=False) + +def import_file(filename): + for asin, edition in read_amazon_file(open(filename)): + index_fields = build_index_fields(asin, edition) + found = pool.build(index_fields) + if 'title' not in found: + print(found) + print(asin) + print(edition) + print(index_fields) + print() + + if not found['title'] and not found['isbn']: + #print 'no pool load book:', asin + # TODO load book + continue + #print asin, found + #print(repr(edition['title'], edition.get('subtitle', None), edition.get('flags', None), edition.get('binding', None))) + if 'sims' in edition: + del edition['sims'] + #print edition + #print + + seen = set() + for k, v in found.iteritems(): + for ekey in v: + if ekey in seen: + continue + keys, thing = follow_redirects(ekey) + seen.update(keys) + assert thing + try: + m = try_merge(edition, ekey, thing) + except: + print(asin) + print(edition) + print(ekey) + print(found) + raise + +# import_file(sys.argv[1]) + +d = sys.argv[1] +for f in os.listdir(d): + if not f.startswith('amazon.'): + continue + print(f) + if '2009-02' in f: + continue + import_file(d + "/" + f) diff --git a/ia-legacy-importer/amazon/list_done.py b/ia-legacy-importer/amazon/list_done.py new file mode 100644 index 00000000..ef1541bc --- /dev/null +++ b/ia-legacy-importer/amazon/list_done.py @@ -0,0 +1,74 @@ +from __future__ import print_function +from lxml.html import fromstring, tostring +from openlibrary.catalog.utils.arc import read_arc, read_body +import re +import os +import sys + +arc_dir = '/2/edward/amazon/arc' +total = 0 +srtitle = 0 +producttitle = 0 + +re_book_url = re.compile('^http://www.amazon.com/[^/]+/dp/([0-9A-Z]{10})/') +re_result_count = re.compile('^Showing ([,0-9]+) - ([,0-9]+) of ([,0-9]+) Results$') + +bad_serp = 0 + +out = open('/2/edward/amazon/crawled2', 'w') + +for filename in (i for i in os.listdir(arc_dir) if i.endswith('.arc')): + print(filename, total, srtitle, producttitle) + for url, wire in read_arc(arc_dir +'/' + filename): + if url.startswith('file'): + continue + if not url.startswith('http://www.amazon.com/s?'): + continue + body = read_body(wire) + doc = fromstring(body) + found = [] + try: + doc.get_element_by_id('noResultsTitle') +# print 'no results:', url + continue + except KeyError: + pass + rc = doc.find_class('resultCount') + if rc: + m = re_result_count.match(rc[0].text) + if m: + (a, b, c) = map(lambda i: int(i.replace(',','')), m.groups()) + if a == c + 1 and b == c: +# print 'result count:', rc[0].text +# print 'empty page' + continue + for e in doc.find_class('fastTrackList'): + if e.text == 'This item is currently not available.': + print(e.text) + + for pt in doc.find_class('productTitle'): + assert pt.tag == 'div' + assert pt[0].tag == 'a' + href = pt[0].attrib['href'] + m = re_book_url.match(href) + found.append(m.group(1)) + total += 1 + producttitle += 1 + + for e in doc.find_class('srTitle'): + td = e.getparent().getparent() + assert td.tag == 'td' + assert td[0].tag == 'a' + href = td[0].attrib['href'] + m = re_book_url.match(href) + found.append(m.group(1)) + total += 1 + srtitle += 1 + + if len(found) == 0: + 
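+ # nothing recognisable on this results page; keep a copy so the parser can be checked by hand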
print(url) + bad_serp += 1 + open('bad_serp%d.html' % bad_serp, 'w').write(body) + for asin in found: + print(asin, file=out) +out.close() diff --git a/ia-legacy-importer/amazon/load_merge.py b/ia-legacy-importer/amazon/load_merge.py new file mode 100644 index 00000000..82b20382 --- /dev/null +++ b/ia-legacy-importer/amazon/load_merge.py @@ -0,0 +1,135 @@ +from __future__ import print_function +from time import time +from catalog.marc.MARC21 import MARC21Record +from catalog.marc.parse import pick_first_date + +from six.moves import urllib + + +entity_fields = ('name', 'birth_date', 'death_date', 'date') + +def find_entity(site, entity): + entity = dict((k, entity[k]) for k in entity_fields if k in entity) + print(entity) + things = site.things(entity) + if not things: + print("person not found") + return + + print("found", len(things), "match") + for key in things: + db_entity = site.withKey(key, lazy=False)._get_data() + for field in entity_fields: + if field in entity: + assert field in db_entity + else: + assert field not in db_entity + +def get_from_archive(locator): + (file, offset, length) = locator.split (":") + offset = int (offset) + length = int (length) + + r0, r1 = offset, offset+length-1 + url = 'http://www.archive.org/download/%s'% file + + assert 0 < length < 100000 + + ureq = urllib.request.Request(url, None, {'Range':'bytes=%d-%d'% (r0, r1)},) + result = urllib.request.urlopen(ureq).read(100000) + rec = MARC21Record(result) + return rec + +def contrib(r): + contribs = [] + for f in r.get_fields('700'): + print(f.subfield_sequence) + contrib = {} + if 'a' not in f.contents and 'c' not in f.contents: + continue # should at least be a name or title + name = " ".join([j.strip(' /,;:') for i, j in f.subfield_sequence if i in 'abc']) + if 'd' in f.contents: + contrib = pick_first_date(f.contents['d']) + contrib['db_name'] = ' '.join([name] + f.contents['d']) + else: + contrib['db_name'] = name + contrib['name'] = name + contrib['entity_type'] = 'person' + subfields = [ + ('a', 'personal_name'), + ('b', 'numeration'), + ('c', 'title') + ] + for subfield, field_name in subfields: + if subfield in f.contents: + contrib[field_name] = ' '.join([x.strip(' /,;:') for x in f.contents[subfield]]) + if 'q' in f.contents: + contrib['fuller_name'] = ' '.join(f.contents['q']) + contribs.append(contrib) + + for f in r.get_fields('710'): + print(f.subfield_sequence) + contrib = { + 'entity_type': 'org', + 'name': " ".join([j.strip(' /,;:') for i, j in f.subfield_sequence if i in 'ab']) + } + contrib['db_name'] = contrib['name'] + contribs.append(contrib) + + for f in r.get_fields('711'): + print(f.subfield_sequence) + contrib = { + 'entity_type': 'event', + 'name': " ".join([j.strip(' /,;:') for i, j in f.subfield_sequence if i in 'acdn']) + } + contrib['db_name'] = contrib['name'] + contribs.append(contrib) + return contribs + +def load(site, filename): + for line in open(filename): + isbn, lc_src, amazon = eval(line) + versions = site.versions({'machine_comment': lc_src}) + assert len(versions) == 1 + thing = site.withID(versions[0]['thing_id']) + + if 'authors' not in amazon: + continue + author_count = 0 + for name, role in amazon['authors']: + if role != 'Author': + continue + author_count+=1 + if author_count > 1: + break + if author_count < 2: + continue + + print(lc_src) + print('amazon:', amazon['authors']) + + + try: + print('LC authors:', [x.name for x in thing.authors]) + except AttributeError: + print('no authors in LC') + lc_contrib = [] + try: + lc_contrib = thing.contributions 
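+ # when LC lists contributions, fetch the MARC record and try to match each 700/710/711 contributor to an existing entity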
+ print('LC contributions:', lc_contrib) + except AttributeError: + print('no contributions in LC') + if lc_contrib: + r = get_from_archive(lc_src) + contrib_detail = contrib(r) + assert len(lc_contrib) == len(contrib_detail) + for c, detail in zip(lc_contrib, contrib_detail): + print(c, end=' ') + find_entity(site, detail) + print() + continue + # for x in web.query("select thing_id from version where machine_comment=" + web.sqlquote(lc)): + # t = site.withID(x.thing_id) + # print t.title + + diff --git a/ia-legacy-importer/amazon/other_editions.py b/ia-legacy-importer/amazon/other_editions.py new file mode 100644 index 00000000..dc367517 --- /dev/null +++ b/ia-legacy-importer/amazon/other_editions.py @@ -0,0 +1,66 @@ +import re +import os.path +from bs4 import BeautifulSoup + +from six.moves import urllib + + +# http://amazon.com/other-editions/dp/0312153325 has: +# http://www.amazon.com/gp/product/0312247869 +re_link = re.compile('^http://www\.amazon\.com/(?:(.*)/dp|gp/product)/(\d{9}[\dX]|B[A-Z0-9]+)$') + +desc_skip = set(['(Bargain Price)', '(Kindle Book)']) + +def read_bucket_table(f): + html = '' + bucket = False + table = False + for line in f: + if line[:-1] == '
    ': + bucket = True + continue + if bucket and line[:-1] == ' ': + table = True + if table: + html += line + if line[:-1] == '
    ': + break + return html + +def parse_html(html): + soup = BeautifulSoup(html, "lxml") + for tr in soup('tr')[2:]: + td = tr('td') + assert len(td) == 3 + td0 = td[0] + assert td0['class'] == 'small' + assert len(td0) == 3 + (nl, link, desc) = td0 + assert nl == '\n' + href = link['href'] + if href.startswith("http://www.amazon.com:80/gp/redirect.html"): + # audio book, skip for now + continue + m = re_link.match(link['href']) + yield str(m.group(2)), desc.strip() + +def get_from_amazon(isbn): + url = 'http://www.amazon.com/dp/other-editions/' + isbn + try: + return urllib.request.urlopen(url).read() + except urllib.error.HTTPError as error: + if error.code != 404: + raise + return '' + +def find_others(isbn, dir): + filename = dir + "/" + isbn + if len(isbn) != 10: + return [] + if not os.path.exists(filename): + open(filename, 'w').write(get_from_amazon(isbn)) + html = read_bucket_table(open(dir + "/" + isbn)) + if not html: + return [] + l = [i for i in parse_html(html) if not i[0].startswith('B') and i[1] not in desc_skip] + return l diff --git a/ia-legacy-importer/amazon/parse.py b/ia-legacy-importer/amazon/parse.py new file mode 100644 index 00000000..f4d940b3 --- /dev/null +++ b/ia-legacy-importer/amazon/parse.py @@ -0,0 +1,626 @@ +from __future__ import print_function +from lxml.html import parse, tostring +import re +import os +import sys +import web +from warnings import warn +from math import floor +from pprint import pprint +import htmlentitydefs + +import six + + +class BrokenTitle(Exception): + pass + +class IncompletePage(Exception): + pass + +class MissingAuthor(Exception): + pass + +role_re = re.compile("^ \(([^)]+)\)") + +#: sample: ' [Paperback, Large Print]' + +re_title = re.compile(""" + (?:\ \[([A-Za-z, ]+)\])? # flags + (?:\(\ ([^()]+|[^()]*\(.*\)[^()]*)\))? + """, re.MULTILINE | re.X) + +re_split_title = re.compile(r'''^ + (.+?(?:\ \(.+\))?) + (?::\ (\ *[^:]+))?$ +''', re.X) + +re_missing_author = re.compile('\n\n(~ )?\(([A-Za-z, ]+)\), ') + +re_list_price = re.compile('^\$([\d,]+)\.(\d\d)$') +re_amazon_price = re.compile('^\$([\d,]+)\.(\d\d)$') +# '$0.04\n \n ' +re_you_save = re.compile('^\$([\d,]+)\.(\d\d)\s*\((\d+)%\)\s*$') + +re_pages = re.compile('^\s*(\d+)(?:\.0)? 
pages\s*$') +re_sales_rank = re.compile('^ #([0-9,]+) in Books') +re_html_in_title = re.compile('', re.I) + +def unescape(text): + def fixup(m): + text = m.group(0) + if text[:2] == "&#": + # character reference + try: + if text[:3] == "&#x": + return six.unichr(int(text[3:-1], 16)) + else: + return six.unichr(int(text[2:-1])) + except ValueError: + pass + else: + # named entity + try: + text = six.unichr(htmlentitydefs.name2codepoint[text[1:-1]]) + except KeyError: + pass + return text # leave as is + return re.sub("&#?\w+;", fixup, text) + +def to_dict(k, v): + return {k: v} if v else None + +def read_authors(by_span): + authors = [] + if re_missing_author.match(by_span.text): + raise MissingAuthor + try: + assert by_span.text in ('\n\n', '\n\n~ ') + except: + print(repr(by_span.text)) + raise + expect_end = False + for e in by_span: + if expect_end: + assert e.tag in ('br', 'span') + break + assert e.tag == 'a' + if e.tail.endswith('\n\n'): + expect_end = True + else: + assert e.tail.endswith(', ') + m = role_re.match(e.tail) + if m: + authors.append({ 'name': e.text, 'role': m.group(1), 'href': e.attrib['href'] }) + else: + authors.append({ 'name': e.text, 'href': e.attrib['href'] }) + return authors + +def get_title_and_authors(doc, title_from_html): + try: + prodImage = doc.get_element_by_id('prodImage') + except KeyError: + raise IncompletePage + full_title = unescape(prodImage.attrib['alt']) # double quoted + full_title = re_html_in_title.sub('', full_title).replace(''', "'") + + m = re_split_title.match(full_title) + (title, subtitle) = m.groups() + # maybe need to descape title + title_id = doc.get_element_by_id('btAsinTitle') + assert title_id.tag == 'span' + assert title_id.getparent().tag == 'h1' + assert title_id.getparent().attrib['class'] == 'parseasinTitle' + buying_div = title_id.getparent().getparent() + assert buying_div.tag == 'div' + assert buying_div.attrib['class'] == 'buying' + by_span = buying_div[1] + assert by_span.tag == 'span' + + book = { + 'full_title': full_title, + 'title': title, + 'has_cover_img': "no-image-avail" not in prodImage.attrib['src'] + } + + authors = [] + if len(by_span) and by_span[0].tag == 'a': + #print len(by_span), [e.tag for e in by_span] + book['authors'] = read_authors(by_span) + title_text = title_id.text_content() + if not title_text.startswith(full_title): + print(('alt:', repr(prodImage.attrib['alt']))) + print(('title mistmach:', repr(full_title), '!=', repr(title_text))) + title_text = title_from_html.decode('latin-1') + print(('title_text:', repr(title_text))) + print(('full_title:', repr(full_title))) + if not title_text.startswith(full_title): + print(('alt:', repr(prodImage.attrib['alt']))) + print(('title mistmach:', repr(full_title), '!=', repr(title_text))) + raise BrokenTitle + if full_title != title_text: + btAsinTitle = title_text[len(full_title):] + m = re_title.match(btAsinTitle) + if not m: + print(('title:', repr(btAsinTitle))) + (flag, binding) = m.groups() + if binding is not None: + book['binding'] = binding + if flag: + book['flag'] = flag + if subtitle: + book['subtitle'] = subtitle + + return book + +def dollars_and_cents(dollars, cents): + # input: dollars and cents as strings + # output: value in cents as an int + return int(dollars.replace(',', '')) * 100 + int(cents) + +def read_price_block(doc): + price_block = doc.get_element_by_id('priceBlock', None) + book = {} + if price_block is None: + return + assert price_block.tag == 'div' and price_block.attrib['class'] == 'buying' + table = price_block[0] + 
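+ # each row of the price table is a (heading, value) pair, e.g. 'List Price:' and '$12.99'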
assert table.tag == 'table' and table.attrib['class'] == 'product' + for tr in table: + assert tr.tag == 'tr' and len(tr) == 2 + assert all(td.tag == 'td' for td in tr) + heading = tr[0].text + value = tr[1].text_content() + + if heading == 'List Price:': + m = re_list_price.match(value) + list_price = dollars_and_cents(m.group(1), m.group(2)) + book["list_price"] = list_price + elif heading == "Price:": + b = tr[1][0] + assert b.tag == 'b' and b.attrib['class'] == 'priceLarge' + m = re_amazon_price.match(b.text) + amazon_price = dollars_and_cents(m.group(1), m.group(2)) + book["amazon_price"] = amazon_price + elif heading == 'You Save:': + continue # don't need to check + # fails for 057124954X: '$0.04\n \n ' + m = re_you_save.match(value) + you_save = dollars_and_cents(m.group(1), m.group(2)) + assert list_price - amazon_price == you_save + assert floor(float(you_save * 100) / list_price + 0.5) == int(m.group(3)) + elif heading == 'Value Priced at:': + continue # skip + m = re_amazon_price.match(value) + book["value_priced_at"] = dollars_and_cents(m.group(1), m.group(2)) + elif heading == 'Import List Price:': + pass + + return book + +def find_avail_span(doc): + for div in doc.find_class('buying'): + if div.tag != 'div' or not len(div): + continue + if div[0].tag == 'span': + span = div[0] + elif div[0].tag == 'br' and div[1].tag == 'b' and div[2].tag == 'span': + span = div[2] + else: + continue + if span.attrib['class'].startswith('avail'): + return span + +def read_avail(doc): + traffic_signals = set(['Red', 'Orange', 'Green']) + span = find_avail_span(doc) + color = span.attrib['class'][5:] + assert color in traffic_signals + gift_wrap = span.getnext().getnext().tail + book = { + 'avail_color': color, + 'amazon_availability': span.text, + 'gift_wrap': bool(gift_wrap) and 'Gift-wrap available' in gift_wrap + } + return book + +def read_other_editions(doc): + oe = doc.get_element_by_id('oeTable', None) + if oe is None: + return + assert oe.tag == 'table' and oe.attrib['class'] == 'otherEditions' + assert len(oe) == 2 and len(oe[0]) == 2 and len(oe[1]) == 2 + assert oe[0][0][0].tag == 'a' + oe = oe[0][0][1] + assert oe.tag == 'table' + other_editions = [] + for tr in oe[1:]: + assert tr.tag == 'tr' + if 'bgcolor' in tr.attrib: + assert tr.attrib['bgcolor'] == '#ffffff' + else: + assert tr[0].attrib['id'] == 'oeShowMore' + break + assert tr[0].attrib['class'] == 'tiny' + a = tr[0][0] + assert a.tag == 'a' + row = [a.attrib['href'][-10:], a.text, a.tail.strip()] + other_editions.append(row) + return {'other_editions': other_editions } + +def read_sims(doc): + sims = doc.find_class('sims-faceouts') + if len(sims) == 0: + return + assert len(sims) == 1 + sims = sims[0] + assert sims.tag == 'table' + found = [] + if sims[0].tag == 'tbody': + tr = sims[0][0] + else: + assert sims[0].tag == 'tr' + tr = sims[0] + for td in tr: + assert td.tag == 'td' + a = td[1][0] + assert a.tag == 'a' + found.append({'asin': a.attrib['href'][-10:], 'title': a.text}) + return to_dict('sims', found) + +def find_product_details_ul(doc): + a = doc.get_element_by_id('productDetails', None) + if a is None: + return + try: + assert a.tag == 'a' and a.attrib['name'] == 'productDetails' + except: + print(tostring(a)) + raise + hr = a.getnext() + assert hr.tag == 'hr' and hr.attrib['class'] == 'bucketDivider' + table = hr.getnext() + td = table[0][0] + assert td.tag == 'td' and td.attrib['class'] == 'bucket' + h2 = td[0] + assert h2.tag == 'h2' and h2.text == 'Product Details' + div = td[1] + assert div.tag == 'div' 
and div.attrib['class'] == 'content' + ul = div[0] + if div[0].tag == 'table': + ul = div[1] + assert ul.tag == 'ul' + assert ul[-1].tag == 'div' and ul[-2].tag == 'p' + return ul + +def read_li(li): + assert li.tag == 'li' + b = li[0] + assert b.tag == 'b' + return b + +re_series = re.compile('^
  • (?:This is item (\d+) in|This item is part of) 7: + print(len(content)) + for num, i in enumerate(content): + print(num, i.tag, i.attrib) + a = content[8] + assert a.tag == 'a' + b = content[9] + assert a.attrib['name'] == 'cited' + found['cited'] = b.text + for k, v in found.items(): + m = re_cite[k].match(v) + found[k] = int(m.group(1)) + return found + +def find_inside_this_book(doc): + for b in doc.find_class('h1'): + if b.text == 'Inside This Book': + assert b.tag == 'b' + return b.getparent() + return None + +def read_first_sentence(inside): + if len(inside) == 4: + assert inside[2].tag == 'span' + assert inside[2].attrib['class'] == 'tiny' + assert inside[2][0].tail.strip() == 'Browse and search another edition of this book.' + div = inside[3] + else: + assert len(inside) == 3 + div = inside[2] + assert div.tag == 'div' and div.attrib['class'] == 'content' + if div[0].tag in ('a', 'b'): + assert div[0].text != 'First Sentence:' + return + assert div[0].tag == 'strong' + assert div[0].text == 'First Sentence:' + assert div[1].tag == 'br' + return div[1].tail.strip(u"\n \xa0") + +def find_bucket(doc, text): + for div in doc.find_class('bucket'): + h2 = div[0] + if h2.tag == 'h2' and h2.text == text: + return div + return None + +# New & Used Textbooks + +def read_subject(doc): + div = find_bucket(doc, 'Look for Similar Items by Subject') + if div is None: + return + assert div.tag == 'div' + form = div[1][0] + assert form.tag == 'form' + input = form[0] + assert input.tag == 'input' and input.attrib['type'] == 'hidden' \ + and input.attrib['name'] == 'index' \ + and input.attrib['value'] == 'books' + found = [] + for input in form[3:-4:3]: + a = input.getnext() + assert a.tag == 'a' + found_text = a.text if len(a) == 0 else a[0].text + assert found_text is not None + found.append(found_text) + return to_dict('subjects', found) + +def read_category(doc): + div = find_bucket(doc, 'Look for Similar Items by Category') + if div is None: + return + assert div.tag == 'div' + ul = div[1][0] + assert ul.tag == 'ul' + found = [] + for li in ul: + assert all(a.tail == ' > ' for a in li[:-1]) + cat = [a.text for a in li] + if cat[-1] == 'All Titles': + cat.pop() + found.append(tuple(cat)) +# if 'Series' in cat: +# edition["series2"] = cat + # maybe strip 'Books' from start of category + found = [i[1:] if i[0] == 'Books' else i for i in found] + return to_dict('category', found) + +def read_tags(doc): + table = doc.find_class('tag-cols') + if len(table) == 0: + return + assert len(table) == 1 + table = table[0] + assert len(table) == 1 + tr = table[0] + +def read_edition(doc, title_from_html=None): + edition = {} + book = get_title_and_authors(doc, title_from_html) + edition.update(book) + + ret = read_price_block(doc) + if ret: + edition.update(ret) + inside = find_inside_this_book(doc) + if inside is not None: + sentence = read_first_sentence(inside) + if sentence: + edition['first_sentence'] = sentence + func = [ + #read_citing, + read_plog, + read_series, + #read_avail, + read_product_details, + read_other_editions, + #read_sims, # not needed now + read_subject, + read_category, + ] + for f in func: + ret = f(doc) + if ret: + edition.update(ret) + parse_publisher(edition) + if 'isbn_10' not in edition and 'asin' not in edition: + return None + return edition + +# ['subtitle', 'binding', 'shipping_weight', 'category', 'first_sentence', 'title', 'full_title', 'authors', 'dimensions', 'publisher', 'language', 'number_of_pages', 'isbn_13', 'isbn_10', 'publish_date'] +def 
edition_to_ol(edition): + ol = {} + fields = ['title', 'subtitle', 'publish_date', 'number_of_pages', 'first_sentence'] + for f in fields: + if f in edition: + ol[f] = edition[f] + if 'isbn_10' in edition: + ol['isbn_10'] = [edition['isbn_10']] + if 'isbn_13' in edition: + ol['isbn_13'] = [edition['isbn_13'].replace('-','')] + if 'category' in edition: + ol['subjects'] = edition['category'] + if 'binding' in edition: + ol['physical_format'] = edition['binding'] + if 'dimensions' in edition: + ol['physical_dimensions'] = edition['dimensions'] + if 'shipping_weight' in edition: + ol['weight'] = edition['shipping_weight'] + if 'authors' in edition: + ol['authors'] = [a for a in edition['authors'] if a['name'] != 'n/a'] + if 'publisher' in edition: + ol['publishers'] = [edition['publisher']] + else: + print('publisher missing') + + for k, v in ol.iteritems(): + if isinstance(v, six.string_types) and v[-1] == '(': + pprint(edition) + print(('ends with "(":', repr(k, v))) + sys.exit(0) + + return ol + +if __name__ == '__main__': + #for dir in ('/2008/sample/', 'pages/'): + page_dir = sys.argv[1] + for filename in os.listdir(page_dir): + #if '1435438671' not in filename: + # continue + if filename.endswith('.swp'): + continue + edition = {} + doc = parse(page_dir + '/' + filename).getroot() + assert doc is not None + edition = read_edition(doc) + ol = edition_to_ol(edition) + pprint (ol) diff --git a/ia-legacy-importer/amazon/read_serp.py b/ia-legacy-importer/amazon/read_serp.py new file mode 100644 index 00000000..a5b6ec38 --- /dev/null +++ b/ia-legacy-importer/amazon/read_serp.py @@ -0,0 +1,79 @@ +from __future__ import print_function +from lxml.html import fromstring +from openlibrary.catalog.utils.arc import read_arc, read_body +import os +import re + +arc_dir = '/2/edward/amazon/arc' + +re_book_url = re.compile('^http://www.amazon.com/[^/]+/dp/([0-9A-Z]{10})/') +re_result_count = re.compile('^Showing ([,0-9]+) - ([,0-9]+) of ([,0-9]+) Results$') +re_title = re.compile('Amazon.com: (.*?)(:?, Page \d+)?') +crawled = set(i[:-1] for i in open('/2/edward/amazon/crawled')) + +# /2/edward/amazon/arc/20100311*.arc + +def find_pt(doc): + found = [] + for pt in doc.find_class('productTitle'): + assert pt.tag == 'div' + assert pt[0].tag == 'a' + href = pt[0].attrib['href'] + m = re_book_url.match(href) + print(m.group(1)) + found.append(m.group(1)) + return found + +def find_srtitle(doc): + found = [] + for e in doc.find_class('srTitle'): + td = e.getparent().getparent() + assert td.tag == 'td' + assert td[0].tag == 'a' + href = td[0].attrib['href'] + m = re_book_url.match(href) + found.append(m.group(1)) + return found + +found_books = set() + +prev = '' +for filename in (i for i in os.listdir(arc_dir) if i.endswith('.arc')): + if not filename.startswith('20100412'): + continue + for url, wire in read_arc(arc_dir +'/' + filename): + #print filename, url + if url.startswith('file'): + continue + if not url.startswith('http://www.amazon.com/s?'): + continue + body = read_body(wire) + m = re_title.search(body) + if m.group(1) != prev: + print(m.group(1)) + prev = m.group(1) + continue + doc = fromstring(body) + try: + doc.get_element_by_id('noResultsTitle') + continue + except KeyError: + pass + rc = doc.find_class('resultCount') + if rc: + m = re_result_count.match(rc[0].text) + if m: + (a, b, c) = map(lambda i: int(i.replace(',','')), m.groups()) + if a == c + 1 and b == c: + continue + for e in doc.find_class('fastTrackList'): + if e.text == 'This item is currently not available.': + print(e.text) + + 
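+ # only srTitle-style results are expected on these pages; any productTitle entries would indicate an unhandled layout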
assert len(find_pt(doc)) == 0 + serp_found = find_srtitle(doc) + for asin in serp_found: + if asin in crawled: + continue + found_books.update(serp_found) + print(len(serp_found), len(found_books), filename, url) diff --git a/ia-legacy-importer/amazon/upload.py b/ia-legacy-importer/amazon/upload.py new file mode 100644 index 00000000..a15dc4b9 --- /dev/null +++ b/ia-legacy-importer/amazon/upload.py @@ -0,0 +1,89 @@ +from __future__ import print_function +from catalog.read_rc import read_rc +import httplib +import web +import time +import sys +from datetime import date, timedelta + +rc = read_rc() +accesskey = rc['s3_accesskey'] +secret = rc['s3_secret'] + +db = web.database(dbn='mysql', host=rc['ia_db_host'], user=rc['ia_db_user'], \ + passwd=rc['ia_db_pass'], db='archive') +db.printing = False + +crawl_dir = '/1/edward/amazon/crawl' +collection = 'ol_data' +mediatype = 'data' + +con = httplib.HTTPConnection('s3.us.archive.org') +con.connect() + +def wait_for_upload(ia): + while True: + rows = list(db.select('catalog', where='identifier = $ia', vars={'ia': ia})) + if len(rows) == 0: + return + print("\r", len(rows), 'tasks still running', end=' ') + time.sleep(5) + print('\ndone') + +no_bucket_error = 'NoSuchBucket' +internal_error = 'InternalError' + +def put_file(con, ia, filename, headers): + print('uploading %s' % filename) + headers['authorization'] = "LOW " + accesskey + ':' + secret + url = 'http://s3.us.archive.org/' + ia + '/' + filename + print(url) + data = open(crawl_dir + '/' + filename).read() + for attempt in range(5): + con.request('PUT', url, data, headers) + res = con.getresponse() + body = res.read() + if '' not in body: + return + print('error') + print(body) + if no_bucket_error not in body and internal_error not in body: + sys.exit(0) + print('retry') + time.sleep(5) + print('too many failed attempts') + +def create_item(con, ia, cur_date): + headers = { + 'x-amz-auto-make-bucket': 1, + 'x-archive-meta01-collection': collection, + 'x-archive-meta-mediatype': mediatype, + 'x-archive-meta-language': 'eng', + 'x-archive-meta-title': 'Amazon crawl ' + cur_date, + 'x-archive-meta-description': 'Crawl of Amazon. Books published on ' + cur_date + '.', + 'x-archive-meta-year': cur_date[:4], + 'x-archive-meta-date': cur_date.replace('-', ''), + } + + filename = 'index.' + cur_date + put_file(con, ia, filename, headers) + +def upload_index(con, cur_date): + ia = 'amazon_crawl.' + cur_date + + create_item(con, ia, cur_date) + wait_for_upload(ia) + time.sleep(5) + + put_file(con, ia, 'amazon.' + cur_date, {}) + put_file(con, ia, 'cats.' + cur_date, {}) + put_file(con, ia, 'list.' 
+ cur_date, {}) + +one_day = timedelta(days=1) +cur = date(2009, 4, 26) # start from +while True: + print(cur) + upload_index(con, str(cur)) + cur -= one_day + +con.close() diff --git a/ia-legacy-importer/amazon/upload_arc.py b/ia-legacy-importer/amazon/upload_arc.py new file mode 100644 index 00000000..45ae5663 --- /dev/null +++ b/ia-legacy-importer/amazon/upload_arc.py @@ -0,0 +1,105 @@ +from __future__ import print_function +from openlibrary.catalog.read_rc import read_rc +import httplib +import web +import time +import sys +import os + +rc = read_rc() +accesskey = rc['s3_accesskey'] +secret = rc['s3_secret'] +#arc_dir = '/2/edward/amazon/arc' +arc_dir = '/0/amazon' + +no_bucket_error = 'NoSuchBucket' +internal_error = 'InternalError' + +done = [ + '20100210013733.arc', + '20100210015013.arc', + '20100210020316.arc', + '20100210021445.arc', + '20100210022726.arc', + '20100210024019.arc', + '20100210025249.arc', + '20100210030609.arc', + '20100210031752.arc', + '20100210033024.arc', + '20100210034255.arc', + '20100210035501.arc', + '20100210040904.arc', + '20100210042130.arc', + '20100210043351.arc', + '20100210044553.arc', + '20100210051017.arc', + '20100210052258.arc', + '20100210053601.arc', + '20100210194700.arc', + '20100210201110.arc', + '20100212000643.arc', + '20100212001705.arc', + '20100212002656.arc', + '20100212004512.arc', + '20100212010934.arc', + '20100212013415.arc', + '20100212015925.arc', + '20100212022248.arc', + '20100212024600.arc', + '20100212030916.arc', + '20100212033221.arc', + '20100212035616.arc', + '20100212042043.arc', + '20100212044622.arc', + '20100212051112.arc', + '20100212053604.arc', + '20100212060140.arc', + '20100212062647.arc', + '20100212065128.arc', + '20100212165731.arc', + '20100212184748.arc', + '20100212184807.arc', + '20100212184822.arc', + '20100212190147.arc', + '20100212192404.arc', + '20100212194513.arc', + '20100212200700.arc', + '20100212202810.arc', + '20100212204852.arc', + '20100212210951.arc', + '20100212213032.arc', + '20100212215107.arc' +] + +def put_file(con, ia, filename, headers): + print('uploading %s' % filename) + headers['authorization'] = "LOW " + accesskey + ':' + secret + url = 'http://s3.us.archive.org/' + ia + '/' + filename + print(url) + data = open(arc_dir + '/' + filename).read() + for attempt in range(5): + con.request('PUT', url, data, headers) + res = con.getresponse() + body = res.read() + if '' not in body: + return + print('error') + print(body) + if no_bucket_error not in body and internal_error not in body: + sys.exit(0) + print('retry') + time.sleep(5) + print('too many failed attempts') + +ia = 'amazon_book_crawl' +for filename in os.listdir(arc_dir): + if filename in done: + continue + if not filename.endswith('.arc'): + continue + print(filename) + con = httplib.HTTPConnection('s3.us.archive.org') + con.connect() + put_file(con, ia, filename, {}) + con.close() + diff --git a/ia-legacy-importer/author/__init__.py b/ia-legacy-importer/author/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/ia-legacy-importer/author/east b/ia-legacy-importer/author/east new file mode 100644 index 00000000..7f2d0084 --- /dev/null +++ b/ia-legacy-importer/author/east @@ -0,0 +1,2156 @@ +Ai, Wei +An, Bin +An, Na +An, Ni +An, Zhimin +Bai, Juyi +Bai, Lin +Bai, Nanfeng +Bai, Tao +Bai, Tian +Bai, Yongquan +Bai, Ziran +Ban, Chao +Bao-Liang, Lu +Bao, Lin +Bao, Zheng +Ben, Lee +BIAO, XIANG +Bi, Chao +Bing, Wang +Bockja, Kim +Boqiao, Tang +Bo, Yang +Bo, Yibo +Bruno, Lee +Bu, Di +Cai, Cheng +Cai, Chusheng +Cai, 
Guo-Qiang +Cai, Jingfeng +Cai, Longyun +Cai, Qian +Cai, Ruixian +Cai, Wenji +Cai, Xiansheng +Cai, Yong +Cai, Yuanpei +Cai, Yun +Cang, Xin +Cao, Pei +Cao, Pi +Cao, Van Vien +Cao, Yang +Cao, Ying +Cao, Yuzhang +Cao, Zhi +Cao, Zuorui +Chan, Chee Onn +Chan, Chee-yan +Chan, Chen Hei +Chang, Chao +Chang, Chen +Chang, Ch?eng-mei +Chang, Ch'eng-mei +Chang, Chung-yuan +Chang, Fa-shun +Chang, Hao +Chang, Hsin-chang +Chang, Hsin-hai +Chang, Hui-chien +Chang, Hung Ta +Chang, Hwan Kim +Chang, Liu +Chang, Ping-lin +Chang, Shu +Changsu, Kim +Chang, Ti-sheng +Chan, Heng Chee +Chan, Heng Leong +Chan, Kai Lok +Chan, Kok Sing +Chan, Tak Cheung +Chan, Wai Kwan +Chaochen, Zhou +Chao, Hung-pen +Chao, Hung-pe?n +Chao, Jiping +Chao, Lin +Chao, Shu-li +Chao, T'ing-chi +Chao, Tzee Cheng +Chao, Yi +Chao, Yu +Chawnshang, Chang +Cheah, Hock Beng +Cheah, Jin Seng +Cheah, Yin Mee +Chen, Ai Ju +Chen, Baochen +Chen, Bingfu +Chen, Boda +Chen, Changming +Chen, Cheng +Chen, Chong Swee +Chen, Chuan Chong +Chen, Ci Liang +Chen, Dao +Chen, Deren +Chen, Dong +Chen, Duxiu +Chen, Erjin +Chen, Fu +Cheng, Chien +Cheng, Ching-wen +Cheng, Dan-an +Chen, Ge +Chen, Geng +Chen, Gengtao +Cheng, Fang +Cheng, Fangwu +Cheng, Gong +Cheng, Guan +Cheng, He +Cheng, Hsieh +Cheng, Hui +Cheng, Kam Fong +Cheng, Ku +Chengliang, Zhu +Cheng, Lu +Cheng, Manchao +Cheng, Meizhen +Cheng, Ming Yu +Chen, Gongbo +Cheng, Peng +Cheng, Qing +Cheng, Qinghua +Cheng, Ren +Cheng, Shifa +Chen, Gu +Chen, Guansheng +Chen, Guo +Cheng, Weidong +Cheng, Yanqiu +Cheng, Zhang +Cheng, Zhenqiu +Chen, Haiyan +Chen, He +Chen, Hongmou +Chen, Hsi-Ju +Chen, Huiguan +Chen, Jai-Sheng +Chen, Ji +Chen, Jia'er +Chen, Jieru +Chen, Jihai +Chen, Jinding +Chen, Jingpan +Chen, Jirui +Chen, Kaige +Chen, Lian +Chen, Liang Yu +Chen, Liang-Yu +Chen, Lifang +Chen, Lu +Chen, May Yee +Chen, Meng +Chen, Meng-chia +Chen, Mingyuan +Chen, Pixian +Chen, Qingchao +Chen, Ruoxi +Chen, Tong +Chen, Tze-tuan +Chen, Voon Fee +Chen, Weiye +Chen, Xi +Chen, Xihe +Chen, Xuezhao +Chen, Yanqing +Chen, Yifei +Chen, Yinke +Chen, Yongfu +Chen, Yongguo +Chen, Yonglin +Chen, Yun +Chen, Yun-Chung +Chen, Yunlin +Chen, Zelin +Chen, Zhaoxia +Chen, Zhi +Chen, Zhi'an +Chen, Zhiyuan +Chen, Zhong +Chen, Zhu +Chen, Zhucai +Chen, Zongji +Chen, Zude +Chia, Chen +Chiang, Chin +Chiang, Ching-kuo +Chiang, Huan-ching +Chiang, Kai-shek +Chiang, Kai-Shek +Chiang, K'ang-hu +Chiang, Kang-hu +Chiang, Kuei +Chiang, Lan-hung Nora +Chiang, Su-hui +Ch'iao, Chien +Chiao, Chien +Chieh, Liu +Chih-Tung, Chang +Chi, Li +Chin, Kin Wah +Chin, Kok Fay +Chin, Peng +Choan-Seng, Song +Cho, Hee +Cho, Hyun-Chul +Choi, Jungwoon +Choi, Yong-Ho +Choi, Young +Chong, Song-won +Chong, Yap Seng +Chong, Yi +Chou, Bih-Er +Chou, Ching-wen +Chou, En-lai +Chou, Fu +Chou, Ping +Chou, Shun-hsin +Chou, Wen-Chung +Chou, Zhang +Cho, Van Tran +Cho, Wha Soon +Cho, Young-rae +Chuang, Chuang Tsai +Chuang, Hua +Chuang, Ying-chang +Chu, Anping +Chuan, Yu +Chu, Ching-wu +Chu, Ching-Wu +Chu, Dagao +Chu, Djang +Chu, Li +Chu, Minyi +Chun, Doo Hwan +Chun, Soonok +Chun, Soon-ok +Chun, Tao +Chu, Va?n Ta??n +Chu, Yo-han +Chu, Youyi +Chu, Youyi +Cui, Shuyi +Cui, Shuzhi +Cui, Yingjie +Cui, Yongqiang +Cui, Yu +Dai, Guan +Dai, Jinhua +Dai, Qing +Dai, Sijie +Dai, Wangshu +Dai, Xi +Dai, Xianglong +Dai, Zhong +Daxing, Han +Dazhong, Xu +De-cheng, Luo +Deng, Jun +Deng, Xiaoping +Deng, Yingchao +Ding, Chen +Ding, Qiulin +Ding, Song +Ding, Wei +Dingyi, Lu +Ding, Zheng +Ding, Zhongli +Dong, Biwu +Dongfang, Wang +Dong, Guangchang +Dong, Han +Dong, He +Dong, Jie +Dong, Jinxia +Do, Ngoc Diep +Dong, 
Shizhong +Dong, Yu +Dong, Zhiming +Dong, Zhongshu +Donovan, Lee +Du, Fu +Du, Guangting +Du, Jian'guo +Du, Juan +Du, Liang +Du, Ling +Du, Liping +Duong, Le Quy +Duong, Tan Nhut +Duong, Thanh Bi?nh +Du, Qinggang +Du, Xia +Du, Xiangwan +Du, Zheng +Ersheng, Gao +Eu-Yang, Kwang +Fang, Dan +Fang, Di +Fang, Ding +Fang, Guan +Fang, Huang +Fang, Lizhi +Fang, Ning +Fang, Qian +Fang, Xiang +Fang, Zhaoben +Fang, Zhi-yang +Fang, Zhong +Fan, Hai-fu +Fan, He +Fan, Hong +Fan, Kang +Fan, Keh-Li +Fan, Ren +Fan, Shen +Fan, Shou-shan +Fan, Wang +Fei, Dawei +Fei, Xiaotong +Fei, Xin +Feng, Boyi +Feng, Congying +Feng, Fang +Feng, Guomei +Feng, Jiannan +Feng, Jicai +Feng, Lei +Feng, Menglong +Feng, Shi +Feng, Shu +Feng, Wu +Feng, Xu +Feng, Youlan +Feng, Yuxiang +Feng, Zhaoshu +Feng, Zhiqiang +Fu, Baoshi +Fu, Biao +Fu, Chongyue +Fu, Chunjiang +Fu, Lin +Fung, Chi Ming +Fu, Ping +Fu, Tianchou +Fu, Xi +Fu, Yi +Fu, Yiyuan +Fu, Zheng +Fu, Zhongwen +Fu, Zizhi +Gan, Fu +Gang, Fan +Gan, Gu +Gang, Yi +Gan, Tang +Gao, Chien +Gao, Chongshou +Gao, Ertai +Gao, gang +Gao, Gang +Gao, Hong +Gao, Jun +Gao, Lin +Gao, Min +Gao, Qiang +Gao, Wei +Gao, Xingjian +Gao, Xueyu +Gao, Yaojie +Gao, Zhan +Gao, Zhenzhong +Ge, Chuan'gui +Ge, Hong +Geng, Biao +Geng, Han +Geng, Junying +Geng, Lin +Geng, Yu +Ge, Wen +Ge, Xiao-jia +Ge, Ying +Ge, You +Gita, May +Goh, Chen Chuan +Goh, Chok Tong +Goh, Keng Swee +Goh, Kim Leng +Goh, Pei Ki +Goh, Poh Seng +Goh, Sing Yau +Gong, Li +Gongsun, Long +Guang, Lu +Guan, Hanqing +Guan, Liang +Guan, Tong +Guan, Yu +Gu, Cheng +Gu, Gongxu +Gu, Hongzhong +Gu, Hui +Gui, Lin +Gui, Shixun +Gu, Jiegang +Gu, Jun +Gu, Li +Guo, Benyu +Guo, Boling +Guo, Daiheng +Guo, Degang +Guo, Huadong +Guo, Juan +Guo, Kaizhou +Guo, Moruo +Guo, Shi +Guo, Wenbin +Guo, Yingqiu +Guo, Yue +Guo, Yuji +Gu, Shulin +Gu, Wei +Gu, Xingyuan +Gu, Xiong +Gu, Yan +Gu, Yuan +Gu, Zhenqing +Gu, Zhiwei +Han, Changfu +Han, Chong +Han, Dongfang +Han, Fei +Han, Fook Kwang +Han, Fu-ru +Han, Lianfen +Han, Mac T?u +Han, Meilin +Han, Mui Ling +Han, Shaogong +Han, Suyin +Han, Tang +Han, Wu +Han, Xiang +Han, Xin +Han, Yazhou +Han, Yi +Han, Zhong +Hao, Jie +He, Chang +He, Changling +He, Da +He, Fei +He-guang, Wu +He, Hanqiu +He, Jie +He, Jifeng +He, Jiuying +He, Li +Heng, Chau +Heng, Chye Kiang +Heng, Sure +He, Ping +Heping, Yu +He, Qinglian +He, Shi +He, Tian +He, Ying +He, Yingqin +He, Yuan-Jin +He, Zuoxiu +Hoang, Chu Duy +Hoang, H?ai Thu?y +Hoang, Ngoc Lung +Ho, Chi Wing +Ho, Chung +Ho, Hsiang-ning +Ho, Mian Lian +Hong, Cao +Hong, Chang +Hong, Chengchou +Hong, Hao +Hong, Qiu +Hong, Ren +Hong, Rengan +Hong, Seung-pyo +Hong, Su +Hong, Xuntao +Hong, Yin +Hong, Ying +Hong, Yingming +Hong, Yu +Hong, Yun-suk +Hong, Zhang +Ho, Peng Kee +Ho, Rih Hwa +Hou, Jianping +Hou, Jinglun +Hou, Wai-lu +Hou, Xianguang +Ho, Wing Meng +Ho, Yi +Ho, Yuk Ming +Hua, Gang +Hua, Guofeng +Hua, Junwu +Hua, Kang +Hua, Lu +Hua, Luogeng +Huang, Bing-shan +Huang, Bingsheng +Huang, Bingyin +Huang, Chieh +Huang, Da +Huang, Ertian +Huang, Fan +Huang, Fu +Huang, Geng +Huang, Gongwang +Huang, Jianping +Huang, Kun +Huang, Po +Huang, Qi +Huang, Qian +Huang, Qun +Huang, Songjie +Huang, Tsung-hsi +Huang, Weiwen +Huang, Xiaokai +Huang, Xiaoming +HUANG, XIAOMING +Huang, Xing +Huang, Yan +Huang, Yao +Huang, Yaozeng +Huang, Yong Ping +Huang, Zhenhua +Huang, Zhihong +Huang, Zunxian +Huan, Li +Hua, Wang +Hua, Wu Yin +Hua, Yun +Hu, Baotong +Hu, Chen +Hu, Ch'iao-mu +Hu, Fang +Hu, Hanmin +Hu, Hesheng +Hu, Hsiu-ying +Hui, Wang +Hui, Yuan +Hui, Zhou +Hu, Jianxiong +Hu, Jinchu +Hu, Jun +Hung, Kwok-yuen +Hung, 
Leung-kim +Hung, Ying-ming +Hu, Ning +Huo, Wang +Hu, Qing +Hu, shi +Hu, Shi +Hu, Shiguang +Hu, Shih Chang +Hu, Shih-Chang +Hu, Tian +Hu, Xiabo +Hu, Yaobang +Hu, Yongkai +Hu, Zhihui +Hu, Zhong-xiong +Hwang, Sun-Ae +Hwang, Yin +I, Cheng +Jaihiun, Kim +Jiang, Bo +Jiang, Guoliang +Jiang, Hong +Jiang, Huan +Jiang, Jiehong +Jiang, Jin +Jiang, Leiwen +Jiang, Pan +Jiang, Ping +Jiang, Qian +Jiang, Qing +Jiang, tianji +Jiang, Wen +Jiang, Yiming +Jiang, Ying +Jiang, Yu +Jiang, Yuan +Jiang, Zemin +Jiang, Zhongyi +Jian, Hu +Jian, Xianai +Jian, Xian'ai +Jian, Zhao +Jiao, Bo +Jiao, Guorui +Jiao, Shunfa +Ji, Dachun +Jie, Chen +Jie, Liang +Jie, Ouyang +Jie, Yuan +Ji, Junxiang +Jikun, Liu +Ji, Lanwei +Ji, Lin +Jin, Bohong +Jin, Cui +Jin, Di +JIN, DI +Jin, Dongyan +Jing, Chi +Jing, Heng +Jing, Ke +Jing, Qi +Jing, Qing +Jingqing, Yang +Jing, Su +Jin, Hui De +Jin, Jiang +Jin, Jie +Jin, Jing +Jin, Li +Jin, Lin +Jin, Nailu +Jin, Wei +Jin, Xuqi +Jin, Yong +Jin, Yun +Ji, Qiang +Ji, Si +Ji, Yuan +Ji-zhou, Yang +Jongsung, Kim +Ju, Zi +Kai, Chen +Kai, Zheng +Kang, Bao +Kang, Feng +Kang, Han +Kang, Mi-sun +Kang, Nae-hui +Kang, Sheng +Kang, Youwei +Katayama, Sen +Kawada, Jun +Ke, Chi +Ke, Fu +Ke, Huang +Ke, Li +Ke, Qin +Ke, Yan +Ke, Yun Lu +Khoo, Boo Teik +Khoo, Hong Woo +Khoo, Hoon Eng +Khoo, Joo Ee +Khoo, Kheng-Hor +Khoo, Seow Hwa +Khoo, Swee Chiow +Kiang, Kang-hu +Kim, Chie-woon +Kim, Chi-ha +Kim, Choong Han +Kim, Chull Baum +Kim, Do-Kyun +Kim, Dong-sung +Kim, Dongwook +Kim, Hak-Joon +Kim, Heechul +Kim, Ho +Kim, Hyo-jin +Kim, Hyung-A +Kim, In +Kim, Jang-Soo +Kim, Jong-Il +KIM, JONG-IL +Kim, Jong Kil +Kim, Kang-wo?n +Kim, Kang Won +Kim, Kap-su +Kim, Kihwan +Kim, Ki-Young +Kim, Kwang Soo +Kim, Kwang-sun +Kim, Kyu-sik +Kim, Pyung Soo +Kim, Ronyoung +Kim, San +Kim, Sang-jin +Kim, Sung-il +Kim, Sung-Soo +Kim, Sung-woo +Kim, Su-yong +Kim, Tae-gyun +Kim, Tae Hee +Kim, Tae-Young +Kim, Unsoo +Kim, Yong-dae +Kim, Yong-il +Kim, Yong-Nam +Kim, Yo?n-kyo?ng +Kim, Young-Sub +Kim, Young-Suk +Kin, Long +Kuan, Hsin-chi +Kuan, Liang +Ku, Fu-sheng +Ku, Hung-ming +Kung, Chen +Kuo, Chu-kun +Kuo, Lien Ying +Kuo, Ping-chia +Kuo, Sung-t'ao +Ku, Sang +Lai, Kwok Kin +Lai, Nam Chen +Lai, Po Kan +Laney, Lee +Lang, Li +Lan, Luh Luh +Lan, Peijin +Lan, Yu +Le, Duc Thuong Thuy +Lee, Chang-Ho +Lee, Chew Kang +Lee, Chi Ho +Lee, Chin-Chiu +Lee, Chin Koon +Lee, Chung Hing +Lee, Ding Fai +Lee, Dongju +Lee, Dong Wook +Lee, Gek Ling +Lee, Hoi-Chang +Lee, Ho Yin +Lee, Hsien Loong +Lee, Kin Kiong +Lee, Kuan Yew +Lee, Kwan +Lee-Lueng, Fu +Lee, May +Lee, Na Hyeon +Lee, Sang-Bok +Lee, Sang-Hun +Lee, Sun-ai +Lee, Sun-young +Lee, Teng-hui +Lee, Tsao Yuan +Lee, Tzu Pheng +Lee, Wai Heng +Lee, Wai-man +Lee, Weng Choy +Lee, Ying-arng +Lee, Ying-Yuan +Lee, Young-Jin +Lei, Chen +Lei, Congyun +Lei, Guang +Lei, Li +Lei, Qin +Le, Manh Hung +Le, Thac Can +Le, Thi Van Hue +Liang, Chen +Liang, Ji +Liang, Liangxing +Liang, Peilong +Liang, Qi +Liang, qichao +Liang, Qichao +Liang, Sicheng +Liang, Xiao +Liang, Xin +Liang, Yan +Liang, Yu +Liang, Yuan +Li, Ao +Liao, Chen +Liao, Zhongkai +Li, Bing +Li, Bing-Ren +Li, Chai +Li, Chengli +Li, Chengsen +Li, Chien-nung +Li, Ching +Li, Chuan-Kuei +Li, Chun +Li, Chunfeng +Li, Chung +Li, Chunxia +Li, Cunxin +Li, Dai +Li, Dajue +Li, Daosheng +Li, Dazhao +Li, Dejin +Li, Deming +Li, Deng +Li, Desheng +Li, Deyin +Lien, Chan +Lienfung, Li +Li, Fanggui +Li, Gonglin +Li, Guang +Li, Guo +Li, Haopei +Li, Ho +Li, Hongzhang +Li, Hongzhi +Lihua, Yang +Li, Jiajun +Li, Jiangshu +Li, Jiaqi +Li, Jinshan +Li, Kaining +Li, Kun +Li, Lan +Li, Lanqing +Li, 
Lian Ong +Li, Lisan +Li, Liu +Li, Lu +Li, Mao +Lim, Bee-Lum +Lim, Boon Keng +Lim, Chu Sing +Li, Meng +Lim, Guan Hua +Li, Min +Li, Mingzhu +Lim, Jae-Won +Lim, Li Ching +Lim, Li Lin +Lim, Poh Eng +Lim, Yew Hock +Li, Na +Lin, Biao +Lin, Cheng +Lin, Dan +Lin, Fanghua +Lin, Fengmian +Ling, Chung +Ling, Kong +Ling, Li +Ling, Liu +Lin, Gu +Ling, Yeou-ruenn +Ling, Yuan +Lin, Handa +Lin, Huang +Li, Nina +Li, Ning +Lin, Jensen +Lin, Jianhua +Lin, Lap-Chew +Lin, Li +Lin, Lu? +Lin, Piao +Lin, Qian +Linshan, Hua +Lin, Shaopei +Lin, Tsung-yi +Lin, Tsung-Yi +Lin, Xie +Lin, Xu +Lin, Ying +Lin, Yue +Lin, Yutang +Lin, Zexu +Lin, Zhan +Lin, Zhengyan +Lin, Zhong +Lin, Zuo +Li, Peiwen +Li, Peizhu +Li, Peng +Li, Qian +Li, Qiangsheng +Li, Qingzhao +Li, Qunying +Li, Ren +Li, Ruihuan +Li, Ruinian +Li, Shangyin +Li, Shang-yin +Li, Shantong +Li, Shiji +Li, Shizhen +Li, Shuang +Li, Shutian +Li, Si +Li, Siguang +Li, Songfu +Li, Su +Li, Tai +Li, Tan +Li, Tana +Li, Tang +Li, Tche-houa +Li, Tie +Liu, Bao +Liu, Binyan +Liu, Cengdian +Liu, Chen +Liu, Chengcai +Liu, Chen Hui +Liu, Chih +Liu, Chin +Liu, Ching +Liu, Chuang +Liu, Dong +Liu, Dongping +Liu, Fang +Liu, Fei +Liu, Fuhua +Liu, Gongwang +Liu, Guoliang +Liu, Haisu +Liu, Han Wen +Liu, Heung Shing +Liu, Huan +Liu, Huaqing +Liu, Hua yang +Liu, Hua-yang +Liu, Huihao +Liu, Huixia +Liu, I-ming +Liu, Jian +Liu, Jianjun +Liu, Jing-tong +Liu, Ji-ping +Liu, Ju +Liu, Jung-en +Liu, Kai +Liu, Kunyi +Liu, Li +LIU, LI +Liu, Liping +Liu, Qiming +Liu, Shaoqi +Liu, Shehui +Liu, Shicong +Liu, Shuzhen +Liu, Taigong +Liu, Tao +Liu, Ts'un-yan +Liu, Weixin +Liu, Wenhui +Liu, Wenmin +Liu, Wenzhe +Liu, Xia +Liu, Xiaobo +Liu, Xiaoqing +Liu, Xing +Liu, Xingzhen +Liu, Xinwu +Liu, Xujie +Liu, Yandong +Liu, Ye +Liu, Yongqing +Liu, Yuanman +Liu, Yun +Liu, Yunfeng +Liu, Zaihua +Liu, Zaixing +Liu, Zhenkai +Liu, Zhijun +Liu, Zhiwei +Liu, Zhonglu +Li, Weining +Li, Wenliang +Li, Wenyan +Li, Xi +Li, Xiangdong +Li, Xiaofeng +Li, Xiaoxiang +Li, Xieu-Lin +Li, Xinyuan +Li, Xuemei +Li, Xuewu +Li, Ye +Li, Yi +Li, Yihua +Li, Yinhe +Li, Yong +Li, Yuanhong +Li, Yuchun +Li, Yu-ming +Li, Yunfei +Li, Zhaoxiang +Li, Zhaoxing +Li, Zheng +Li, Zhenji +Li, Zhenjie +Li, Zhensheng +Li, Zhiwu +Li, Zhuo +Li, Zigan +Li, Zishun +Li, Zongren +Li, Zongwei +Li, Zunian +Lo, Chiung-yu +Lo, Hsiang-lin +Lo, Kuang-pin +Lo, Mei Hing +Long, Xu +Lu, Chuanrong +Lu, Daren +Lu, Feng +Lufeng, Tang +Lu, Gusun +Lu, Jiaquan +Lu, Jiuyuan +Lu, Le +Lu, Li +Lu, Meng +Luo, Jialun +Luo, Ruiqing +Luo, Ti-lun +Luo, Wei +Luo, Weihong +Luo, Yang +Luo, Yin +Luo, Zewen +Luo, Zhaohong +Lu, Ruilan +Lu, Shengli +Lu, Sheng-yen +Lu, Shi +Lu, Shoukang +Lu, Shun +Lu, Ting +Lu, Xinchang +Lu, Xinhua +Lu, Xinsen +Lu, Xixing +Lu, Yubin +Lu, Zhan +Ma, Baolin +Ma, Chih +Ma, Cindy W +Ma, Huan +Ma, Ji +Ma, Kai +Ma, ke +Malborg, Kim +Ma, Lunzy +Ma, Mingjia +Ma, Mingtong +Ma, Ngok +Ma, Ning +Mao, Dun +Mao, Peiqi +Mao, Yan +Mao, Zedong +Ma, Shijun +Ma, Shuli +Ma, Wen +Ma, Xia +Ma, Xiaodong +Ma, Yinchu +Ma, Ying +Ma, Ying-jeou +Ma, Zhiyuan +Ma, Zhonglin +Ma, Zongjin +Mei, Ding +Mei, Hua +Mei, Lin +Mei, Ying +Mei, Zhang +Mei, Zu-yan +Meng, Hao-jan +Meng, Haoran +Meng, Hua +Meng, Jian +Menglin, Zhao +Meng, Shen +Meng, Xi +Meng, Xiankun +Meng, Xianshi +Meng, Yue +Miao, Ying +Ming, Fan +Ming, Hai +Ming, Ho-Yu +Ming-le, Yao +Ming, Lu +Min, Jiayin +Min, Xu +Min, You +Mo, Bangxian +Mo, Yamin +Mo, Yan +Mo, Yang +Mu, Soeng +Mu, Soeng Sunim +Mu, Xia +Mu, Zi +Nanquan, Lu +Ng, Aik Kwang +Ng, Bee Chin +Ng, Beng Yeong +Ng, Chee Yuen +Ng, Chin-Keong +Ng, Hock Guan +Ng, Ho-yee +Ng, Kung-fu 
+Ng, Pak Tee +Ng, Seik Weng +Ng, Suat Tong +Nguyen, Dinh Huu +Nguyen, Duc Hiep +Nguyen, Duy Thai Son +Nguyen, Khanh +Nguyen, Thanh Hai +Nguyen, Thi Dieu +Nguyen, Thi Minh Ha +Nguyen, Thi Thanh Binh +Nguyen, Van Canh +Nguyen, Van Chuyen +Nguyen, Van Dao +Nguyen, Van Ly +Nguyen, Van Nghi +Nguyen, Van Thoai +Nguyen, Viet Dung +Nguyen, Viet Thanh +Nguyen, Xuan Oanh +Nguyen, Xuan Thu +Ng, Wun Jern +Ning, Qiang +Ouyang, Yi +Ouyang, Yu +Pan, Chengbiao +Pan, Chengdong +Pan, Guxi +Pan, Jiezi +Pan, Ling +Pan, Song +Pan, Tianshou +Pan, Wuhua +Pan, Xiafeng +Pan, Yue +Pan, Yunhe +Pei-ji, Chen +Pei-kang, Chang +Peilin, Sun +Pei, Songzhi +Pei, Yan +Peng, Dehuai +Peng, Feng +Peng, Liang +Peng, Ming-min +Peng, Peiyun +Peng, Shengchao +Peng, Shi +Peng, Xianchu +Peng, Zhen +Phan, Chu Trinh +Phan, Nhie?n Ha?o +Phan, Thie??n Cha?u +Pi, Lei +Pi, Li +Ping, Fan +Ping, Xin +Ping, Zhou +Po, Lee +Po, Sung-nien +Pu, Wei +Qiang, Dong +Qiang, Han +Qiang, Zhang +Qian, Li +Qian, Lin +Qian, Ma +Qian, Mei +Qian, Qichen +Qian, Shi +Qian, Wu +Qian, Xuantong +Qian, Yongfu +Qian, Zheng +Qian, Zhengying +Qian, Zhongshu +Qiao, Hong +Qiao, Jinlin +Qiao, Yi +Qi, Baishi +Qi, Dong +Qi, Huang +Qi, Jiguang +Qi, Min +Qin, Danhua +Qin, Xiao-meng +Qin, Yu +Qin, Zhong +Qi, Pan +Qi, Peng +Qiqian, Li +Qiu, Jin +Qiu, Jun +Qiu, Yu +Qi, Xin +Qi, Yan +Qiying, Hu +Qu, Bo +Ren, De-lin +Ren, Guang +Ren, Jianxin +Ren, Jie +Ren, Jishun +Ren, Lu +Ren, Wu +Ren, Xingsheng +Ren, Xiong +Ren, Yi +Ren, Yongchang +Ren, Zhong +Ruan, Huaduan +Ruan, Ji +Rui, Guozhang +Rui, Lin +Rui, Mu +Rui, Naiwei +Rui, Zhang +Sha, Jicai +Sha, Kokken +Sha, Lin +Shang, Xianmin +Shang, Yuan Ren +Shao-kung, Lin +Shao, Wei Liu +Shao, Xunzheng +Shao, Ya +Sha, Yexin +Shen, Baozhen +Sheng, Huanye +Sheng, Lijun +Sheng, Peilin +Sheng, Shicai +Sheng, Zhi-yong +Shen, Huang +Shen, Jiaben +Shen, Jianmin +Shen, Jie +SHEN, JIE +Shen, Junru +Shen, Kai +Shen, Kangshen +Shen, Kuo +Shen, Li +Shen, Weirong +Shen, Xianjie +Shen, Zhang +Shen, Zhao-wen +Shen, Zhou +Shen, Ziyin +Shi, Chen +Shi, Hui +Shi, Jun +Shi, Kefa +Shi, Lang +Shi, Min +Shimin, Geng +Shi, Qinan +Shi, Song +Shi, Tao +Shi, Wei +Shi, Xiaojing +Shi, Xiaoqing +Shixuan, Xu +Shi, Yan +Shi, Young +Shi, Yu +Shi, Zuhui +ShouQing, Wang +Shui, Wei +Shui, Yi +Shu, Li +Shu, Lin +Si, Chi Ko +Si, Ma +Sima, Qian +SiMa, Qian +Si, Ren +Situ, Tan +Si, Yuan +Song, Ci +Song, Dong-Wook +Song, Geng +Song, Jiaoren +Song, Jinshou +Song, Nong +Song, Ping +Song, Qi +Song, Shouxiang +Song, Wan +Song, Wu +Song, Xing-Chang +Song, Yankun +Song, Yu +Song, Zheyuan +So-Young, Lee +Su, Dajun +Su, Fu +Su, Hao +Su, Hua +Su, Huana +Su, Ling +Sun, Chao +Sun, Chengnan +Sun, Fuchu +Sun, Guangyuan +Sun, Haichen +Sun, Han +Sun, Jian +Sun, Jianhong +Sun, Kaitai +Sun, Liang +Sun, Ou +Sun, Shifang +Sun, Shuyun +Sun, Wu +Sun, Xiang +Sun, Xiaochun +Sun, Xingyuan +Sun, Xu +Sun, Xue-quan +Sun, Yanqing +Sun, Yat-sen +Sun, Yingjie +Sun, Youjun +Sun, Yue +Sun, Zhen +Sun, Zhiwei +Sun, Zuxun +Su, Rong +Su, Shi +Su, Wenming +Su, Xiaojun +Su, Yu +Su, Zongwei +Taeho, Kim +Tai, Chen +Tai, Ming Cheung +Takashi, Inoguchi +Takashi, Negishi +Tan, Ai Mei +Tan, Beng Luan +Tan, Boon Tee +Tan, Cheng Han +Tan, Cheng Lock +Tan, Chin Kwang +Tan, Chong Kee +Tan, Dun +Tang, Jinfa +Tang, Jing +Tang, Junyi +Tang, Li +Tang, Ting-Ao +Tang, Wei +Tang, Xiaofang +Tang, Xiren +Tang, Yin +Tang, Yungmei +Tang, Zhaoliang +Tang, Zhou +Tan, Hong +Tan, Hong Yew +Tan, Huaixiang +Tan, Jiazhen +Tan, Juay Miang +Tan, Khee Giap +Tan, Kok-Keong +Tan, Koonlin +Tan, Lee Meng +Tan, Lin-tung +Tan, Loke Khoon +Tan, Mew Hong 
+Tan, Ong Bee +Tan, Phay Ping +Tan, Siew Ee +Tan, Siew Sin +Tan, Sitong +Tan, Sok Khim +Tan, Soo Jiuan +Tan, Su-Lyn +Tan, Tai Wei +Tan, Tee Jim +Tan, Teik-Kheong +Tan, Thiam Soon +Tan, Tin Wee +Tan, Yang Meng +Tan, Yankai +Tan, Yew Hock +Tan, Yew Soon +Tan, Yi +Tao, Cheng +T'ao, Ch'ien +T'ao, Chi'en +Tao, Hua +Tao, Jian +Tao, Jin +Tao, Xingzhi +Tao, Zhang +Tao, Zhenghua +Tay, Boon Nga +Teng, Chao-chao +Teng, Chia-yee +Thai, Ngoc Diep +Thai, Quang Trung +Tian, Jia +Tie, Ning +Tieya, Wang +Tie, Yuan +Ting, Joo Fai +Ting, Li +Ting, Su-Yin +Ting, Wai +Ting, Wang +Ting, Wei +Tong, Dizhou +Tong, Jinnan +Tong, Li +Tong, Shijun +Tong, Zhongtao +Tong, Zhongyi +Torrey, Kim +Tsai, Chin +Ts'ai, Yuan +Tung, shu +T'ung, Shu +Vu, Thien Binh +Vu, Trong Phung +Wan, Changsen +Wang, Anshi +Wang, Anyi +Wang, Bi +Wang, Biao +Wang, Bing +Wang, Can +Wang, Chen-ho +Wang, Chi-ssu +Wang, Chong +Wang, Dao +Wang, Dong +Wang, Dulu +Wang, Du Lu +Wang, Dun +Wang, Duo +Wang, En'guang +Wang, Fangyu +Wang, Fanxi +Wang, Fengzhu +Wang, Fuchun +Wang, Fuzhi +Wang, Gu +Wang, Guangmei +Wang, Guangya +Wang, Guangyi +Wang, Hongtu +Wang, Hongwen +Wang, Hsing-pei +Wang, Huan +Wang, Huanan +Wang, Huijiong +Wang, Hui-ling +Wang, Huiming +Wang, Jiancheng +Wang, Jianmin +Wang, Jianzheng +Wang, Jingwei +Wang, Jinshan +Wang, Jiye +Wang, Kemin +Wang, Kui +Wang, Kun +Wang, Kung-hsing +Wang, Kuo-wei +Wang, Liang +Wang, Liangbi +Wang, Liming +Wang, Liqun +Wang, Lixian +Wang, Lixiong +Wang, Lu +Wang, Luxiang +Wang, Maorong +Wang, Min +Wang, Ming +Wang, Mingjie +Wang, Pi +Wang, Pin +Wang, Pingyang +Wang, Pinxian +Wang, Qiliang +Wang, Qinglin +Wang, Qingyun +Wang, Rongda +Wang, Rui +Wang, Sheng +Wang, Sheng-Wei +Wang, Shijun +Wang, Shixun +Wang, Shiyi +Wang, Shizhen +Wang, Shouren +Wang, Shuo +Wang, Song +Wang, Sung +Wang, Tieya +Wang, Tongsan +Wang, Tuoming +Wang, Wenhua +Wang, Wenjiong +Wang, Xi +Wang, Xianzhi +Wang, Xiao +Wang, Xiaobo +Wang, Xiaoning +Wang, Xiaotian +Wang, Xiaoyan +Wang, Xiaoyun +Wang, Xing Chu +Wang, Xiu +Wang, Xizhi +Wang, Xu +Wang, Xuanjie +Wang, Xuecheng +Wang, Xuewen +Wang, Yanrong +Wang, Yao-t'ing +Wang, Yi'e +Wang, Yinzhi +Wang, Yue +Wang, Yuehan +Wang, Zheng +Wang, Zhengshu +Wang, Zhengyi +Wang, Zhiping +Wang, Zhiwen +Wang, Zhizhi +Wang, Zhongchun +Wang, Zhonggao +Wang, Zhongyi +Wang, Zili +Wan, Kwai Pik +Wan, Li +WAN-SOON, KIM +Wee, Kim Wee +Wei, Dong +Wei, Fajie +Wei, Hu +Wei, Ji +Wei, Jingsheng +Wei, Li Chen +Wei, Liming +Wei, Luo +Weiming, Shen +Wei, Ping +Weiping, Wang +Wei, Song +Wei, Su +Wei, Sui +Wei, Tian +Wei, Wen +Wei, Wenbo +Wei, Wenhua +Wei, Xu +Wei, Yan +Wei, Yang +Wei, Yuanping +Wei, Yue +Weiyu, Jiang +Wei, Zhang +Wei, Zhao +Wei, Zhen +Wen, Chi +Wen, Ding +Wen, Hao +Wen, Hong +Wen, Hua +Wen, Jingen +Wen, Jinhai +Wenkuan, Ma +Wen, Qing +Wenqing, Wang +Wen, Tianxiang +Wen, Yiduo +Wen, Yinghong +Wen, You +Wen, Yu +Wen, Zhengming +Wen, Zhenheng +Wen, Zhong +Whei-Jen, Chen +Wong, Chian Voen +Wong, Choon Ching +Wong, Heung Wah +Wong, Jim +Wong, Kang-Ying +Wong, Kar-wai +Wong, Kin-yuen +Wong, Kwei Cheong +Wong, Kwok-Chu +Wong, Phui Nam +Wong, Shiu Hon +Wong, Sook Ching +Wong, Wah Sang +Wong, Yew Kwan +Wu, Chen +Wu, Chengkang +Wu, Chen-Xu +Wu, Chong-shi +Wu, Chou +Wu, Chuanjun +Wu, Daisheng +Wu, Enyu +Wu, Guang +Wu, Guanghua +Wu, Guanzhong +Wu, Guo +Wu, Hao +Wu, Jialiang +Wu, Jie +Wu, Jiemin +Wu, Jin +Wu, Jingchao +Wu, Jinglian +Wu, Jingzi +Wu, Juntao +Wu, Kepi +Wu, Kong +Wu, Kwang +Wu, Mingyu +Wu, Ningkun +Wu, Piao +Wu, Qun'gan +Wu, Shunjun +Wu, Tao +Wu, Tingfang +Wu, Tsong-shien +Wu, Tung +Wu, Wenjin +Wu, 
Wenjun +Wu, Xiao An +Wu, Xiaochun +Wu, Xing +Wu, Xiufen +Wu, Xun +Wu, Yi +Wu, Yiming +Wu, Ying-hua +Wu, Yuanfang +Wu, Yuzhang +Wu, Zhang +Wu, Zhengyi +Wu, Zhou +Xia, Guang +Xia, Guoping +Xia, Hong +Xia, Jian-Bai +Xia, Nai +Xiang, Huaicheng +Xiang, Mu +Xiang, Ying +Xiang, Zhang +XIAOBO, LU +Xiao, Cheng +Xiao, Fan +Xiao, Fei +Xiao, Han +Xiao, Hong +Xiao, Jimei +Xiao, Ke +Xiaoli, Sun +Xiao, Ma +Xiaoming, Zhang +Xiao, Qian +Xiao, Qin +XIAO, QIN +Xiao, Shiling +Xiao, Yan +Xiao, Yang +Xiao, Yanling +Xiao, Zhang +Xia, Yang +Xia, Yi +Xie, Fei +Xie, Jialin +Xie, Jin +Xie, Jinyuan +Xie, Juezai +Xie, Jun +Xie, Kai +Xie, Qu-bing +Xie, Xiande +Xie, Xide +Xie, Yu-Zhang +Xie, Zheng +Xie, Zhufan +Xi, Gao +Ximen, Jiye +Xin, Gao +Xing, Huo-yu +Xing, Lin +Xing, Lu +Xing, Lujian +Xing, Shu +Xin, Hua +XINJIANG, RONG +Xin, Lu +Xin, Mu +Xin, Tian +Xin, Wen +Xin, Ying +Xin, Zheng +Xiong, Fan +Xiong, Qinglai +Xiu, Yu +Xi, Zhang +Xuan, Wu +Xu, Beihong +Xu, Bing +Xu, Dan +XU, DAN +Xu, Dixin +Xue, Hanqin +Xue, Jianxin +Xue, Yu +Xu, Gan +Xu, Guangqi +Xu, Guohua +Xu, Hong-yan +Xu, Hong Yan +Xu, Huping +Xu, Jian +Xu, Jianchu +Xu, Jiawei +Xu, Jiazhong +Xu, Jincheng +Xu, Liangying +Xu, Meng +Xu, Mengzhong +Xu, Ming +Xun, Lin +Xun, Zhao +Xu, Qian +Xu, Senlin +xu, Shen +Xu, Shichang +Xu, Weiguo +Xu, Wen +Xu, Xi +Xu, Xian +Xu, Xianquan +Xu, Xiaoge +Xu, Xiaojie +Xu, Xing +Xu, Xuchang +Xu, Yihou +Xu, Yuanzhong +Xu, Yuhuan +Xu, Yunlong +Xu, Zhaoran +Xu, Zhu +Yan, Chongnian +Yan, Fu +Yang, Bo +Yang, Chao +Yang, Chen +Yang, Chengwu +Yang, Dadi +Yang, Dao +Yang, Fang +Yang, Fu +Yang, Fudong +Yang, Hanxi +Yang, Hongyuan +Yang, Hsiao +Yang, Huan +Yang, Hui +Yang, Huizhong +Yang, Jiasan +Yang, Jing +Yang, Jinghui +Yang, Jingyu +Yang, Jizhou +Yang, Kaizhong +Yang, Ke +Yang, Lan +Yang, Liping +Yang, Liwei +Yang, Shangkun +Yang, Wan-li +Yang, Weitao +Yang, Wenyi +Yang, Wenzhen +Yang, Xian +Yang, Xiao +Yang, Xiaojun +Yang, Xiaoqing +Yang, Xiguang +Yang, Xinrong +Yang, Yin +Yang, Ying +Yang, Yi Xian +Yang, Yi-yen +Yang, Yongjian +Yang, Yu +Yang, Yu? 
+Yang, Zenghong +Yang, Zhensheng +Yang, Zhi-jun +Yang, Zhu +Yang, Zi +Yan, Han +Yan, Hong +Yan, Jian +Yan, Jiaqi +Yan, Kejia +Yan, Menghui +Yan, Pei-Ming +Yan, Ruizhen +Yan, Shang +Yan, Sun +Yan, Wang +Yan, Wei +Yan, Xin +Yan, Xingjian +Yan, Xuetong +Yan, Yixun +Yan, Yu +Yan, Zhen'guo +Yao, Chang +Yao, Dianfang +Yao, Fu +Yao, Huang +Yao, Li +Yao, Ming +Yao, Qian +Yao, Suihan +Yao, Wang +Yao, Wenyuan +Yao, Zhang +Yau, Ching +Ye, Bai +Ye, Duzheng +Ye, Jianying +Ye, Jin +Ye, Lin-Sheng +Ye, Minghan +Yen, Chia-kan +Yen, Hsi-shan +Yen, Ping-Chiu +Yen, Wei +Yen, Wenchun +Ye, Ping Kuei +Ye, Sen +Ye, Su +Ye, Xiao +Ye, Zhongxing +YI, DING +Yi, Hong +Yi, Huang +Yi, Jiang +Yi, Jin +Yi, Lu +Yin, Binyong +Yin, Chamroeun +Ying, Guo +Ying, Jianzhe +Ying, Lei +Ying, Lu +Ying, Lungan +Ying, Yu +Yin, Hongfu +Yin, Huihe +Yin, Jian +Yin, Jianxing +Yin, Shun +Yi, Peng +Yi, Sang +Yi, Su-gwang +Yi, Ying +Yi, Zeng +Yi, Zhongtian +Yong, Hoi-Sen +Yong, Kwet Yew +Yong, Pung How +Yong, Wang +Yong, Yan +Yoon, Choong-Nam +Yoon, Hyung Kim +Yoon, Myung-sook +You, Jia +You, Mo +Younglae, Kim +Young-moo, Kim +You, Xu +You, Yu +Yuan, Chen +Yuan, Daoxian +Yuan, Hong +Yuan, Kang +Yuan, Longping +Yuan, Muzhi +Yuan, Shao Wen +Yuan, Shen +Yuan, Shibing +Yuan, Shikai +Yuan, Xue +Yuan, Yu +Yuan, Yunsheng +Yu, Bin +Yu, Chang-Chin +Yu, Changlong +Yu, Dan +Yu, Dejun +Yu, Dong +Yue, Chongxi +Yue, Fengxia +Yue, Ma +Yu, Fei +Yu, Guang +Yu, Hao +Yu, He +Yu, Hsiu-ching +Yu, Hua +Yu, Hui-chan +Yu, Huihua +Yu, Jing-Yuan +Yu, Jung-yul +Yu, Li Ming +Yu, Lin +Yu, Maohong +Yunbo, Liu +Yung Teng, Chia-yee +Yun, Kim +Yun, Ma +Yun, Mi Antorini +Yun, Qing +Yun, Shouping +Yun, Wu +Yu, Pingbo +Yu, Qin +Yu, Sianglin +Yu, Sung +Yu, Tianwei +Yu, Wei +Yu, Xiang +Yu, Xiaohui +Yu, Xiaoyang +Yu, Xie +Yu, Xihan +Yu, Xuanji +Yu, Yaosheng +Yuyi, Wang +Yu, Young-nan +Yu, Youren +Yu, Yuntian +Yu, Zhang +Yu, Zhao +Yu, Zhu +Yu, Zhuoyun +Yu, Zicheng +Zaifu, Liu +Zeng, Cheng +Zeng, Fanren +Zeng, Guofan +Zeng, Minzu +Zeng, Weiqi +Zeng, Xianyi +Zeng, Zhen +Zhai, Zhenhua +Zhang, Bin +Zhang, Chu +Zhang, Chun +Zhang, Dachun +Zhang, Feng +Zhang, guohua +Zhang, Guohua +Zhang, Hao +Zhang, Hua +Zhang, Huan +Zhang, Junxiang +Zhang, Min +Zhang, Nan +Zhang, Ning +Zhang, Qian +Zhang, Rui +Zhang, Weihong +Zhang, Xiaoping +Zhang, Xin +Zhang, Yanqing +Zhang, Yuan +Zhang, Yue +Zhang, Zhong +Zhao, Cangbi +Zhao, Dan +Zhao, Han +Zhao, Hong +Zhao, Jun +Zhao, Lan +Zhao, Liang +Zhao, Lihong +Zhao, Man +Zhao, Mengfu +Zhao, Muying +Zhao, Qi +Zhao, Qizheng +Zhao, Rui +Zhao, Shuhan +Zhao, Wei +Zhao, Xiaolei +Zhao, Xin +Zhao, Yan +Zhao, Yong +Zhao, Yuqi +Zhao, Zhentao +Zhao, Ziyang +Zheng, Chengsi +Zheng, Dai +Zheng, Guangmei +Zheng, Guili +Zheng, Guo +Zheng, Guogu +Zheng, Guoxiong +Zheng, Hong +Zheng, Jie +Zheng, Jun +Zheng, Junli +Zheng, Lizhong +Zheng, Long +Zheng, Lu +Zheng, Mianping +Zheng, Ping +Zheng, Qing +Zheng, Quan +Zheng, Rusi +Zheng, Shiling +Zheng, Tan +Zheng, Wu +Zheng, Xiaoxu +Zhengxin, Chen +Zheng, Xun +Zheng, Yangwen +Zheng, Yide +Zheng, Yong-Nian +Zheng, Yulian +Zheng, Zhao +Zheng, Zhenman +Zheng, Zhensun +Zheng, Zhi +Zhen, Rong +Zhen, Yuan +Zhi, Chen +Zhi, Feng +Zhigang, Guo +Zhiming, Yuan +Zhi, Yang +Zhi, Yu +Zhong, Bai-song +Zhong, Gongfu +Zhong, Hong +Zhong, Jin +Zhong, Junhua +Zhongmin, Han +Zhong, Shizhen +Zhong, Xiangchong +Zhong, Xiu +Zhongyi, Yuan +Zhong, Zheng +Zhou, Baozhong +Zhou, Can +Zhou, Chuncai +Zhou, Daguan +Zhou, Di +Zhou, Dingzhi +Zhou, Enlai +Zhou, Huang +Zhou, Ji +Zhou, Jianchao +Zhou, Jianmin +Zhou, Jianren +Zhou, Kaiya +Zhou, Keqin +Zhou, Lei +Zhou, 
Lingzhong +Zhou, Lixing +Zhou, Mi +Zhou, Nanzhao +Zhou, Shidi +Zhou, Siyong +Zhou, Xiaowen +Zhou, Xuan +Zhou, Xun +Zhou, Yan +Zhou, Yiming +Zhou, Yu +Zhou, Yun +Zhou, Zhigang +Zhou, Zhiyi +Zhuang, Fenggan +Zhuang, Li +Zhuang, Youjuan +Zhu, Baoxun +Zhu, Bingyao +Zhu, Chen +Zhu, De +Zhuge, Liang +Zhu, Guanya +Zhu, Guobin +Zhu, Hongda +Zhu, Huayou +Zhu, Jiajin +Zhu, Jianhua +Zhu, Jie +Zhu, Junyi +Zhu, Liang +Zhu, Meilin +Zhu, Miaolong +Zhuo, Huang +Zhuo, Jing-Schmidt +Zhu, Qi +Zhu, Qianzhi +Zhu, Qiuxia +Zhu, Rizhang +Zhu, Rongji +Zhu, Shanan +Zhu, shenghao +Zhu, Shenghao +Zhu, Shijie +Zhu, Tingcheng +Zhu, Xian +Zhu, Xiao Di +Zhu, Xiaodong +Zhu, Xuan +Zhu, Yao +Zhu, Zhengming +Zou, Rong +Zuo, Boyang +Zuo, Qiuming +Zuo, Zongtang diff --git a/ia-legacy-importer/author/list_titles.py b/ia-legacy-importer/author/list_titles.py new file mode 100644 index 00000000..bc36cfd2 --- /dev/null +++ b/ia-legacy-importer/author/list_titles.py @@ -0,0 +1,24 @@ +from __future__ import print_function +titles = {} +with_title = {} + +for line in open("/1/pharos/edward/titles"): + try: + loc, fields = eval(line) + except SyntaxError: + break + except ValueError: + continue + t = [b for a, b in fields if a == 'c'] + if len(t) != 1: + continue + fields = tuple((a, b.strip('.') if a=='d' else b) for a, b in fields) + title = t[0].strip(' ,.').lower() + titles[title] = titles.get(title, 0) + 1 + with_title.setdefault(title, {}) + with_title[title][fields] = with_title[title].get(fields, 0) + 1 + +for k, v in sorted(((a, b) for a, b in titles.items() if b > 10), reverse=True, key=lambda x: x[1]): + print((repr(k), v)) + for a, b in sorted(((a, b) for a, b in with_title[k].items() if b > 5), reverse=True, key=lambda x: x[1])[0:30]: + print((' ', a, b)) \ No newline at end of file diff --git a/ia-legacy-importer/author/marc.py b/ia-legacy-importer/author/marc.py new file mode 100644 index 00000000..4b0a1542 --- /dev/null +++ b/ia-legacy-importer/author/marc.py @@ -0,0 +1,47 @@ +from __future__ import print_function +from catalog.infostore import get_site +from catalog.marc.db.web_marc_db import search_query +from catalog.get_ia import get_data +from catalog.marc.fast_parse import get_all_subfields, get_tag_lines, get_first_tag, get_subfields +import sys +site = get_site() + +name = sys.argv[1] # example: 'Leonardo da Vinci' +author_keys = site.things({'type': '/type/author', 'name': name}) +print(len(author_keys), 'authors found') + +edition_keys = set() +for ak in author_keys: + edition_keys.update(site.things({'type': '/type/edition', 'authors': ak})) +print(len(edition_keys), 'editions found') + +locs = set() +for ek in edition_keys: + e = site.withKey(ek) + for i in e.isbn_10 if e.isbn_10 else []: + locs.update(search_query('isbn', i)) + for i in e.lccn if e.lccn else []: + locs.update(search_query('lccn', i)) + for i in e.oclc_numbers if e.oclc_numbers else []: + locs.update(search_query('oclc', i)) +print(len(locs), 'MARC records found') + +def ldv(line): + for s in ('1452', '1519', 'eonard', 'inci'): + if line.find(s) != -1: + return True + return False + +for loc in locs: +# print loc + data = get_data(loc) + if not data: + print("couldn't get") + continue + line = get_first_tag(data, set(['100', '110', '111'])) + if line and ldv(line): + print(list(get_all_subfields(line))) + + line = get_first_tag(data, set(['700', '710', '711'])) + if line and ldv(line): + print(list(get_all_subfields(line))) diff --git a/ia-legacy-importer/author/merge.py b/ia-legacy-importer/author/merge.py new file mode 100755 index 
00000000..c2ad310f --- /dev/null +++ b/ia-legacy-importer/author/merge.py @@ -0,0 +1,220 @@ +# -*- coding: utf-8 -*- +from __future__ import print_function +from openlibrary.catalog.importer.db_read import withKey, get_things, get_mc +from openlibrary.catalog.read_rc import read_rc +from openlibrary.catalog.utils import key_int, match_with_bad_chars, pick_best_author, remove_trailing_number_dot +from unicodedata import normalize +import web +import re +import sys +import codecs + +import six +from six.moves import urllib + +sys.path.append('/home/edward/src/olapi') +from olapi import OpenLibrary, unmarshal, Reference +from openlibrary.catalog.utils.edit import fix_edition +from openlibrary.catalog.utils.query import query_iter + +def urlread(url): + return urllib.request.urlopen(url).read() + +def norm(s): + return normalize('NFC', s) + +def copy_fields(from_author, to_author, name): + new_fields = { 'name': name, 'personal_name': name } + for k, v in from_author.iteritems(): + if k in ('name', 'personal_name', 'key', 'last_modified', 'type', 'id', 'revision'): + continue + if k in to_author: + assert v == to_author[k] + else: + new_fields[k] = v + return new_fields + +def test_copy_fields(): + f = {'name': 'Sheila K. McCullagh', 'personal_name': 'Sheila K. McCullagh', 'last_modified': {'type': '/type/datetime', 'value': '2008-08-30 20:40:41.784992'}, 'key': '/a/OL4340365A', 'birth_date': '1920', 'type': {'key': '/type/author'}, 'id': 18087251, 'revision': 1} + t = {'name': 'Sheila K. McCullagh', 'last_modified': {'type': '/type/datetime', 'value': '2008-04-29 13:35:46.87638'}, 'key': '/a/OL2622088A', 'type': {'key': '/type/author'}, 'id': 9890186, 'revision': 1} + + assert copy_fields(f, t, 'Sheila K. McCullagh') == {'birth_date': '1920', 'name': 'Sheila K. McCullagh', 'personal_name': 'Sheila K. 
McCullagh'} + + +def update_author(key, new): + q = { 'key': key, } + for k, v in new.iteritems(): + q[k] = { 'connect': 'update', 'value': v } + print(ol.write(q, comment='merge author')) + +def update_edition(ol, e, old, new, debug=False): + key = e['key'] + if debug: + print('key:', key) + print('old:', old) + print('new:', new) + fix_edition(key, e, ol) + authors = [] + if debug: + print('current authors:', e['authors']) + for cur in e['authors']: + cur = cur['key'] + if debug: + print(old, cur in old) + a = new if cur in old else cur + if debug: + print(cur, '->', a) + if a not in authors: + authors.append(a) + if debug: + print('authors:', authors) + e['authors'] = [{'key': a} for a in authors] + + try: + ret = ol.save(key, e, 'merge authors') + except: + if debug: + print(e) + raise + if debug: + print(ret) + + update = [] + for wkey in e.get('works', []): + need_update = False + print('work:', wkey) + w = ol.get(wkey) + for a in w['authors']: + if a['author'] in old: + a['author'] = Reference(new) + need_update = True + if need_update: + update.append(w) + + if update: + ret = ol.save_many(update, 'merge authors') + +def switch_author(ol, old, new, other, debug=False): + q = { 'authors': old, 'type': '/type/edition', } + for e in query_iter(q): + if debug: + print('switch author:', e['key']) + print(e) + e = ol.get(e['key']) + update_edition(ol, e, other, new, debug) + +def make_redirect(ol, old, new): + r = {'type': {'key': '/type/redirect'}, 'location': new} + ol.save(old, r, 'merge authors, replace with redirect') + +re_number_dot = re.compile('\d{2,}[- ]*(\.+)$') + +def do_normalize(author_key, best_key, authors): + #print "do_normalize(%s, %s, %s)" % (author_key, best_key, authors) + need_update = False + a = ol.get(author_key) + if author_key == best_key: + for k, v in a.items(): + if 'date' in k: + m = re_number_dot.search(v) + if m: + need_update = True + v = v[:-len(m.group(1))] + if not isinstance(v, six.text_type): + continue + norm_v = norm(v) + if v == norm_v: + continue + a[k] = norm_v + need_update = True + else: + best = ol.get(best_key) + author_keys = set(k for k in a.keys() + best.keys() if k not in ('key', 'last_modified', 'type', 'id', 'revision')) + for k in author_keys: + if k not in best: + v = a[k] + if not isinstance(v, six.text_type): + continue + norm_v = norm(v) + if v == norm_v: + continue + a[k] = norm_v + need_update = True + continue + v = best[k] + if 'date' in k: + v = remove_trailing_number_dot(v) + if isinstance(v, six.text_type): + v = norm(v) + if k not in a or v != a[k]: + a[k] = v + need_update = True + if not need_update: + return + #print 'save(%s, %s)' % (author_key, repr(a)) + ol.save(author_key, a, 'merge authors') + +def has_image(key): + url = 'https://covers.openlibrary.org/a/query?olid=' + key[3:] + ret = urlread(url).strip() + return ret != '[]' + +def merge_authors(ol, keys, debug=False): +# print 'merge author %s:"%s" and %s:"%s"' % (author['key'], author['name'], merge_with['key'], merge_with['name']) +# print 'becomes: "%s"' % repr(new_name) + authors = [a for a in (withKey(k) for k in keys) if a['type']['key'] != '/type/redirect'] + not_redirect = set(a['key'] for a in authors) + if debug: + for a in authors: + print(a) + + assert all(a['type']['key'] == '/type/author' for a in authors) + name1 = authors[0]['name'] + for a in authors: + print(repr(a['key'], a['name'])) + assert all(match_with_bad_chars(a['name'], name1) for a in authors[1:]) + + best_key = pick_best_author(authors)['key'] + + imgs = [a['key'] for a in authors 
if a['key'] != '/a/OL2688880A' and has_image(a['key'])] + if len(imgs) == 1: + new_key = imgs[0] + else: + new_key = "/a/OL%dA" % min(key_int(a) for a in authors) + # Molière and O. J. O. Ferreira + if len(imgs) != 0: + print('imgs:', imgs) + return # skip + if not (imgs == [u'/a/OL21848A', u'/a/OL4280680A'] \ + or imgs == [u'/a/OL325189A', u'/a/OL266422A'] \ + or imgs == [u'/a/OL5160945A', u'/a/OL5776228A']): + print(imgs) + assert len(imgs) == 0 + + print(new_key) + print(best_key) + + do_normalize(new_key, best_key, authors) + old_keys = set(k for k in keys if k != new_key) + print('old keys:', old_keys) + + for old in old_keys: + # /b/OL21291659M + switch_author(ol, old, new_key, old_keys, debug=True) + if old in not_redirect: + make_redirect(ol, old, new_key) + q = { 'authors': old, 'type': '/type/edition', } + if list(get_things(q)) != []: + switch_author(ol, old, new_key, old_keys, debug=True) + #l = list(query_iter(q)) + #print old, l + #assert l == [] + +if __name__ == '__main__': + sys.stdout = codecs.getwriter('utf-8')(sys.stdout) + + rc = read_rc() + ol = OpenLibrary("http://openlibrary.org") + ol.login('EdwardBot', rc['EdwardBot']) + assert len(sys.argv) > 2 + merge_authors(ol, sys.argv[1:]) diff --git a/ia-legacy-importer/author/new.py b/ia-legacy-importer/author/new.py new file mode 100644 index 00000000..71a2eff9 --- /dev/null +++ b/ia-legacy-importer/author/new.py @@ -0,0 +1,21 @@ +from __future__ import print_function +from catalog.olwrite import Infogami +from catalog.read_rc import read_rc +import sys + +rc = read_rc() +infogami = Infogami(rc['infogami']) +infogami.login('EdwardBot', rc['EdwardBot']) + +name = sys.argv[1] + +q = { + 'create': 'unless_exists', + 'name': name, + 'personal_name': name, + 'entity_type': 'person', + 'key': infogami.new_key('/type/author'), + 'type': '/type/author', +} + +print(infogami.write(q, comment='create author')) diff --git a/ia-legacy-importer/author/noble.py b/ia-legacy-importer/author/noble.py new file mode 100644 index 00000000..5b1ac9e9 --- /dev/null +++ b/ia-legacy-importer/author/noble.py @@ -0,0 +1,71 @@ +# coding=utf-8 +from __future__ import print_function +from catalog.get_ia import read_marc_file +from catalog.read_rc import read_rc +from time import time +from catalog.marc.fast_parse import index_fields, get_tag_lines, get_first_tag, get_all_subfields +import web +import os +import os.path +import re +import sys + +titles = [ "Accolade", "Adi", "Aetheling", "Aga Khan", "Ajaw", "Ali'i", + "Allamah", "Altgrave", "Ammaveedu", "Anji", "Ryūkyū", "Archtreasurer", + "Aryamehr", "Atabeg", "Ban", "Baron", "Batonishvili", "Begum", "Bey", + "Boier", "Boyar", "Bulou", "Burgmann", "Buring Khan", "Caliph", + "Castellan", "Chakravatin", "Comte", "Conde", "Count", + "Count palatine", "Countess", "Crown prince", "Daula", + "Despot", "Doge", "Dowager", "Duchess of Rothesay", "Duke", "Earl", + "Edler", "Elector", "Elteber", "Emir", "Emperor", "Emperor-elect", + "Erbherr", "Feudal baron", "Fils de France", "Fraujaz", "Fürst", + "Grand duke", "Grand prince", "Grand Župan", "Grandee", "Haty-a", + "Hersir", "Hidalgo", "Highness", "Hold", "Hteik Tin", "Ichirgu-boil", + "Infante", "Jang", "Jarl", "Jonkheer", "Junker", "Kavkhan", "Khagan", + "Khagan Bek", "Khan", "Khanum", "Khatun", "Knight", "Knyaz", + "Kodaw-gyi", "Kralj", "Lady", "Lamido", "Landgrave", "Lendmann", + "Lord", "Madame Royale", "Magnate", "Maha Uparaja", + "Maha Uparaja Anaudrapa Ainshe Min", "Maharaja", "Maharajadhiraja", + "Maharana", "Maharao", "Maharaol", "Malik", "Margrave", 
"Marquess", + "Marquis de Bauffremont", "Marquise", "Mepe-Mepeta", "Mesne lord", + "Mian", "Min Ye", "Min-nyi Min-tha", "Mir", "Mirza", "Monsieur", "Mormaer", "Morza", "Mwami", "Naib", "Nawab", "Nayak", "Negus", "Nobile", "Obalumo", "Orangun", "Aftab", "Ottoman", "Padishah", "Paigah", "Hyderabad", "Paladin", "Palaiyakkarar", "Palatine", "Panapillai Amma", "Paramount Ruler", "Pasha", "Patricianship", "Pharaoh", "Piast dynasty", "Prescriptive barony", "Prince", "Prince du Sang", "Prince-Bishop", "Princely Highness", "Princeps", "Princess", "Principalía", "Privy chamber", "Rai", "Raja", "Rajah Muda of Sarawak", "Rajus", "Rana", "Rao Raja", "Ratu", "Ridder", "Ro", "Roko", "Sado Min", "Sahib", "Samanta", "Sawai Maharaja", "Shah", "Shahzada", "Shamkhal", "Shanyu", "Shwe Kodaw-gyi", "Shwe Kodaw-gyi Awratha", "Shwe Kodaw-gyi Rajaputra", "Sidi", "Sir", "Sultan", "Sunan", "Susuhunan", "Szlachta", "Tenant-in-chief", "Thakur", "Thampi", "Tsar", "Tsarevitch", "Tu'i", "Ueekata", "Uparaja", "Uparat", "Viceroy", "Victory", "Vidame", "Viscount", "Vizier", "Wazirzada", "Yang di-Pertuan Besar", "Zamindar", "Zeman", "Župa"] + +rc = read_rc() +web.config.db_parameters = dict(dbn='postgres', db='ol_merge', user=rc['user'], pw=rc['pw'], host=rc['host']) +web.config.db_printing = False +web.load() + +def sources(): + return ((i.id, i.archive_id, i.name) for i in web.select('marc_source')) + +def process_record(pos, loc, data): + for tag in '100', '700': + line = get_first_tag(data, set([tag])) + if line: + fields = list(get_all_subfields(line)) + if any(k == 'c' for k, v in fields): + print((loc, fields)) + +def files(ia): + endings = ['.mrc', '.marc', '.out', '.dat', '.records.utf8'] + def good(filename): + return any(filename.endswith(e) for e in endings) + + dir = rc['marc_path'] + ia + dir_len = len(dir) + 1 + files = [] + for dirpath, dirnames, filenames in os.walk(dir): + files.extend(dirpath + "/" + f for f in sorted(filenames)) + return [(i[dir_len:], os.path.getsize(i)) for i in files if good(i)] + +rec_no = 0 + +for source_id, ia, name in sources(): + for part, size in files(ia): + full_part = ia + "/" + part + filename = rc['marc_path'] + full_part + assert os.path.exists(filename) + f = open(filename) + for pos, loc, data in read_marc_file(full_part, f): + rec_no +=1 + process_record(pos, loc, data) diff --git a/ia-legacy-importer/author/rename.py b/ia-legacy-importer/author/rename.py new file mode 100755 index 00000000..24240575 --- /dev/null +++ b/ia-legacy-importer/author/rename.py @@ -0,0 +1,217 @@ +#!/usr/bin/python + +from __future__ import print_function +import web +import re +import sys +import codecs + +sys.stdout = codecs.getwriter('utf-8')(sys.stdout) + +web.load() + +from infogami.infobase.infobase import Infobase +import infogami.infobase.writequery as writequery +site = Infobase().get_site('openlibrary.org') + +re_marc_name = re.compile('^(.*), (.*)$') +re_end_dot = re.compile('[^ ][^ ]\.$', re.UNICODE) +re_odd_dot = re.compile('[^ ][^ ]\. 
', re.UNICODE) +re_initial_then_dot = re.compile(r'\b[A-Z]\.') + +def find_by_statements(author_key): + q = { + 'authors': author_key, + 'type': '/type/edition', + } + by = [] + for key in site.things(q): + try: + by.append(site.withKey(key).by_statement.value) + except AttributeError: + pass + return by + +def east_in_by_statement(name, flipped, by_statements): + assert name.find(', ') != -1 + name = name.replace('.', '') + name = name.replace(', ', ' ') + if name == flipped.replace('.', ''): + return False + for by in by_statements: + if by.find(name) != -1: + return True + return False + +def get_type_id(type): + w = "key='" + type + "' and site_id=1" + return web.select('thing', what='id', where=w)[0].id + +author_type_id = get_type_id('/type/author') + +def get_thing(id): + sql = "select key, value from datum where thing_id=%d and end_revision=2147483647 and key != 'type'" % id + iter = web.query(sql) + thing = {} + for row in iter: + thing[row.key] = row.value + return thing + +def get_author_by_name(name): + sql = "select id from thing, datum where thing.type=$type and thing.id=thing_id and datum.key='name' and datum.value=$name and datum.datatype=2 and datum.end_revision=2147483647" + iter = web.query(sql, vars={'name': name, 'type': author_type_id}) + return [row.id for row in iter] + +def flip_name(name): + # strip end dots like this: "Smith, John." but not like this: "Smith, J." + m = re_end_dot.search(name) + if m: + name = name[:-1] + + m = re_marc_name.match(name) + return m.group(2) + ' ' + m.group(1) + +def pick_name(a, b, flipped): + if re_initial_then_dot.search(a): + return flipped + else: + return b + +east_list = [line[:-1].lower() for line in open("east")] +east = frozenset(east_list + [flip_name(i) for i in east_list]) + +def author_dates_match(a, b): + for k in ['birth_date', 'death_date', 'date']: + if k in a and k in b and a[k] != b[k]: + return False + return True + +def get_other_authors(name): + other = get_author_by_name(name) + if name.find('.') != -1: + name = name.replace('.', '') + other.extend(get_author_by_name(name)) + return other + +def key_int(rec): + return int(web.numify(rec['key'])) + +def switch_author(old, new): + q = { 'authors': old['key'], 'type': '/type/edition', } + for key in site.things(q): + edition = site.withKey(key) + authors = [] + for author in edition.authors: + if author.key == old['key']: + author_key = new['key'] + else: + author_key = author.key + authors.append({ 'key': author_key }) + + q = { + 'key': key, + 'authors': { 'connect': 'update_list', 'value': authors } + } + site.write(q, comment='fix author name') + +def make_redirect(old, new): + q = { + 'key': old['key'], + 'location': {'connect': 'update', 'value': new['key'] }, + 'type': {'connect': 'update', 'value': '/type/redirect' }, + } + for k in old.iterkeys(): + if k != 'key': + q[str(k)] = { 'connect': 'update', 'value': None } + print(site.write(q, comment='replace with redirect')) + +def copy_fields(from_author, to_author, name): + new_fields = { 'name': name, 'personal_name': name } + for k, v in from_author.iteritems(): + if k in ('name', 'key'): + continue + if k in author: + assert v == to_author[k] + else: + new_fields[k] = v + return new_fields + +def update_author(key, new): + q = { 'key': key, } + for k, v in new.iteritems(): + q[k] = { 'connect': 'update', 'value': v } + print(site.write(q, comment='fix author name')) + +def merge_authors(author, merge_with, name): + print('merge author %s:"%s" and %s:"%s"' % (author['key'], author['name'], 
merge_with['key'], merge_with['name'])) + new_name = pick_name(author['name'], merge_with['name'], name) + print('becomes: "%s"' % new_name) + if key_int(author) < key_int(merge_with): + new_key = author['key'] + print("copy fields from merge_with to", new_key) + new = copy_fields(merge_with, author, new_name) + update_author(new_key, new) + switch_author(merge_with, author) +# print "delete merge_with" + make_redirect(merge_with, author) + else: + new_key = merge_with['key'] + print("copy fields from author to", new_key) + new = copy_fields(merge_with, author, new_name) + update_author(new_key, new) + switch_author(author, merge_with) +# print "delete author" + make_redirect(author, merge_with) + print() + +print('running query') +# limit for test runs +for thing_row in web.select('thing', what='id, key', where='type='+repr(author_type_id), limit=10000): + id = thing_row.id + author = get_thing(id) + + if 'personal_name' not in author \ + or author['personal_name'] != author['name']: + continue + if author['name'].find(', ') == -1: + continue + if author['name'].lower().replace('.', '') in east: + continue + + key = author['key'] + name = flip_name(author['name']) + other = get_other_authors(name) + if len(other) == 0 and not re_odd_dot.search(author['name']): + by_statements = find_by_statements(author['key']) + print(author['name'], "by:", ', '.join('"%s"' % i for i in by_statements)) + if east_in_by_statement(author['name'], name, by_statements): + print("east in by statement") + continue + print("rename %s to %s" % (repr(author['name']), repr(name))) + q = { + 'key': key, + 'name': { 'connect': 'update', 'value': name}, + 'personal_name': { 'connect': 'update', 'value': name}, + } + print(repr(q)) + continue + + if len(other) != 1: +# print "other length:", other + continue + # don't merge authors when more than one like "Smith, John" + if len(get_author_by_name(author['name'])) > 1: +# print "found more authors with same name" + continue + + merge_with = get_thing(other[0]) + if not author_dates_match(author, merge_with): + print("date mismatch") + continue + by_statements = find_by_statements(author['key']) + print(author['name'], "by:", ', '.join('"%s"' % i for i in by_statements)) + if east_in_by_statement(author['name'], name, by_statements): + print("east in by statement") + print() + continue + merge_authors(author, merge_with, name) diff --git a/ia-legacy-importer/author/utils.py b/ia-legacy-importer/author/utils.py new file mode 100644 index 00000000..b8534738 --- /dev/null +++ b/ia-legacy-importer/author/utils.py @@ -0,0 +1,51 @@ +import re + +re_marc_name = re.compile('^(.*), (.*)$') +re_initial_then_dot = re.compile(r'\b[A-Z]\.') + +def flip_name(name): + m = re_marc_name.match(name) + return m.group(2) + ' ' + m.group(1) + +def pick_name(a, b): + if re_initial_then_dot.search(a): + return flip_name(a) + else: + return b + +def east_in_by_statement(name, by_statements): + assert name.find(', ') != -1 + name = name.replace('.', '') + flipped = flip_name(name) + name = name.replace(', ', ' ') + if name == flipped: + return False + for by in by_statements: + if by.find(name) != -1: + return True + return False + +def test_merge(): + data = [ + (u'Hood, Christopher', u'Christopher Hood', u'Christopher Hood'), + (u'Pawsey, Margaret M.', u'Margaret M Pawsey', u'Margaret M. Pawsey'), + (u'Elchardus, M.', u'M Elchardus', u'M. 
Elchardus'), + (u'Hayes, Mike.', u'Mike Hayes', u'Mike Hayes'), + (u'Krause, Rainer.', u'Rainer Krause', u'Rainer Krause'), + (u'Hoffmann, Manfred.', u'Manfred Hoffmann', u'Manfred Hoffmann'), + (u'Masson, Veneta.', u'Veneta Masson', u'Veneta Masson'), + (u'Baker, Ernest.', u'Ernest Baker', u'Ernest Baker'), + (u'Hooper, James.', u'James Hooper', u'James Hooper'), + (u'Bront\xeb, Charlotte', u'Charlotte Bront\xeb', u'Charlotte Bront\xeb'), + (u'Nichols, Francis Henry', u'Francis Henry Nichols', u'Francis Henry Nichols'), + (u'Becker, Bernd', u'Bernd Becker', u'Bernd Becker'), + (u'Sadleir, Richard.', u'Richard Sadleir', u'Richard Sadleir'), + ] + for a, b, want in data: + assert pick_name(a, b) == want + + assert east_in_by_statement("Wang, Qi", ["Wang Qi."]) + assert not east_in_by_statement("Walker, Charles L.",\ + ["edited by A. Karl Larson and Katharine Miles Larson."]) + assert not east_in_by_statement("Luoma, Gary A.", ["Gary A. Luoma"]) + assert not east_in_by_statement("Tan, Tan", ["Tan Tan zhu.", "Tan Tan zhu.", "Tan Tan ; [cha tu Li Ruguang ; ze ren bian ji Wang Zhengxiang]."]) diff --git a/ia-legacy-importer/author/web_merge.py b/ia-legacy-importer/author/web_merge.py new file mode 100644 index 00000000..7cb203bf --- /dev/null +++ b/ia-legacy-importer/author/web_merge.py @@ -0,0 +1,48 @@ +from __future__ import print_function +import web +from catalog.db_read import withKey +from pprint import pformat + +urls = ( + '/', 'index' +) + +base = 'http://openlibrary.org' + +class index: + def GET(self): + web.header('Content-Type','text/html; charset=utf-8', unique=True) + input = web.input() + print("\nAuthor merge") + print("

    Author merge

    ") + print('
    ') + print('') + print('') + author = {} + for field in ('a', 'b'): + print('') + print('') + print('') + if 'a' in author and 'b' in author: + a = author['a'] + b = author['b'] + keys = [withKey(prop['key'])['name'] for prop in withKey('/type/author')['properties']] + for k in keys: + if k in a or k in b: + print('' % \ + (k, a.get(k, ''), b.get(k, ''))) + print('
    Authors') + if field in input: + key = input[field] + if key.startswith(base): + key = key[len(base):] + author[field] = withKey(key) + print('' % (field, key)) + else: + print('' % field) + print('
    %s%s%s
    ') + print("") + +web.webapi.internalerror = web.debugerror + +if __name__ == "__main__": web.run(urls, globals(), web.reloader) diff --git a/ia-legacy-importer/author/web_merge2.py b/ia-legacy-importer/author/web_merge2.py new file mode 100644 index 00000000..482dca4a --- /dev/null +++ b/ia-legacy-importer/author/web_merge2.py @@ -0,0 +1,100 @@ +import web +import re +import simplejson as json +from pprint import pformat + +from catalog.utils.query import query_iter + +from six.moves.urllib.request import urlopen + + +urls = ( + '/', 'index' +) +app = web.application(urls, globals()) + +re_year = re.compile('^(\d+)[,.*]+$') + +def result_table(data, birth, death, order): + html = ' %d results' % len(data) + l = [] + def clean(i, default, field): + if field not in i: + return default + if i[field] is None: + return '' + m = re_year.match(i[field]) + return m.group(1) if m else i[field] + + data = [ + { + 'key': i['key'], + 'name': i['name'], + 'birth': clean(i, birth, 'birth_date'), + 'death': clean(i, death, 'death_date'), + } for i in data] + + base_url = web.htmlquote("?birth=%s&death=%s&order=" % (web.urlquote(birth), web.urlquote(death))) + html += '' + html += '
    Name' + if birth: + html += 'birth' + else: + html += 'birth' + if death: + html += 'death' + else: + html += 'death' + html += '' + if order: + data = sorted(data, key=lambda i:i[order]) + for i in data: + html += '%s%s%s' % (i['key'], web.htmlquote(i['name']), i['birth'], i['death']) + return '' + html + '
    ' + +def get_all(url): + all = [] + offset = 0 + limit = 500 + while True: + ret = json.load(urlopen(url + "&limit=%d&offset=%d" % (limit, offset))) + if not ret: + return all + all += ret + if len(all) >= 1000: + return all + offset += limit + +class index: + def GET(self): + input = web.input() + birth = input.get('birth', '').strip() + death = input.get('death', '').strip() + order = input.get('order', '').strip() + if order not in ('', 'name', 'birth', 'death'): + order = '' + html = ''' + + + +Merge author + + + +''' + html += '\n' + html += 'Birth: \n' % web.htmlquote(birth) + html += 'Death: \n' % web.htmlquote(death) + html += '\n' + + if birth or death: + url = 'http://openlibrary.org/query.json?type=/type/author&birth_date=%s&death_date=%s&name=' % (web.urlquote(birth), web.urlquote(death)) + data = get_all(url) + html += result_table(data, birth, death, order) + return html + '\n' + +if __name__ == "__main__": + app.run() diff --git a/ia-legacy-importer/crawl/catalogue.nla.gov.au/crawl.py b/ia-legacy-importer/crawl/catalogue.nla.gov.au/crawl.py new file mode 100644 index 00000000..ee187057 --- /dev/null +++ b/ia-legacy-importer/crawl/catalogue.nla.gov.au/crawl.py @@ -0,0 +1,107 @@ +from __future__ import print_function +import re +from os.path import exists + +from six.moves.urllib.request import urlopen + + +# crawl catalogue.nla.gov.au + +re_th = re.compile('^(\d{3})$', re.I) +re_td = re.compile('^(.*)$') +re_span = re.compile('\|(.|&(?:gt|lt|amp);)(.*?)') + +trans = dict(lt='<', gt='>', amp='&') + +def read_row(tag, row): + assert len(row) == 3 + if tag[0:2] == '00': + assert all(i == '' for i in row[0:1]) + return (tag, row[2]) + else: + end = 0 + subfields = [] + while end != len(row[2]): + m = re_span.match(row[2], end) + end = m.end() + (k, v) = m.groups() + if len(k) != 1: + k = trans[k[1:-1]] + subfields.append((k, v)) + assert all(len(i) == 1 for i in row[0:1]) + return (tag, row[0], row[1], subfields) + +def extract_marc(f): + expect = 'table' + col = 0 + row = [] + lines = [] + for line in f: # state machine + if expect == 'table': + if '' in line: + expect = 'tr' + continue + if expect == 'tr': + if line.startswith('
    '): + break + assert line.startswith('') + expect = 'th' + continue + if expect == 'th': + m = re_th.match(line) + assert m + tag = m.group(1) + expect = 'td' + continue + if expect == 'td': + if line.startswith(''): + lines.append(read_row(tag, row)) + tag = None + row = [] + expect = 'tr' + continue + if line == '\n': + expect = 'span' + continue + m = re_td.match(line) + row.append(m.group(1)) + continue + if expect == 'span': + row.append(line[:-1]) + expect = '/td' + continue + if expect == '/td': + assert line == '\n' + expect = 'td' + continue + return lines + +i = 1 +while True: + i+=1 + filename = 'marc/%d' % i + if exists(filename): + continue + print(i, end=' ') + url = 'http://catalogue.nla.gov.au/Record/%d/Details' % i + web_input = None + for attempt in range(5): + try: + web_input = urlopen(url) + break + except: + pass + if not web_input: + break + + out = open('marc/%d' % i, 'w') + try: + marc = extract_marc(web_input) + except: + print(url) + raise + print(len(marc)) + for line in marc: + print(line, file=out) + out.close() + #sleep(0.5) diff --git a/ia-legacy-importer/dup/authors.py b/ia-legacy-importer/dup/authors.py new file mode 100644 index 00000000..657d5680 --- /dev/null +++ b/ia-legacy-importer/dup/authors.py @@ -0,0 +1,121 @@ +from __future__ import print_function +from catalog.infostore import get_site +from catalog.read_rc import read_rc +import web +import sys +import codecs +import os.path +import re +from catalog.olwrite import Infogami +site = get_site() + +import psycopg2 +rc = read_rc() +infogami = Infogami(rc['infogami']) +infogami.login('EdwardBot', rc['EdwardBot']) + +re_marc_name = re.compile('^(.*), (.*)$') +re_end_dot = re.compile('[^ ][^ ]\.$', re.UNICODE) + +out = open('author_replace3', 'w') + +# find books with matching ISBN and fix them to use better author record + +def flip_name(name): + # strip end dots like this: "Smith, John." but not like this: "Smith, J." 
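+    # e.g. "Smith, John." becomes "John Smith", while "Smith, J." keeps its dot and becomes "J. Smith"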
+ m = re_end_dot.search(name) + if m: + name = name[:-1] + + m = re_marc_name.match(name) + return m.group(2) + ' ' + m.group(1) + +conn = psycopg2.connect("dbname='%s' user='%s' host='%s' password='%s'" \ + % ('ol_merge', rc['user'], rc['host'], rc['pw'])); +cur = conn.cursor() + +author_fields = ('key', 'name', 'title', 'birth_date', 'death_date', 'personal_name') + +sys.stdout = codecs.getwriter('utf-8')(sys.stdout) +for line in open('dups'): + isbn, num = eval(line) + if isbn < '0273314165': + continue + cur.execute('select key from isbn where value=%(v)s', {'v':isbn}) + found = [] + names = {} + for i in cur.fetchall(): + key = i[0] + e = site.withKey(key) + author_list = e.authors or [] + authors = [dict(((k, v) for k, v in a._get_data().items() if k in author_fields)) for a in author_list if a] + for a in authors: + if 'name' not in a: + continue + name = a['name'] + if name.find(', ') != -1: + name = flip_name(name) + a2 = a.copy() + a2['edition'] = key + names.setdefault(name, []).append(a2) + found.append((key, authors)) + if len([1 for k, a in found if a]) < 2: + continue + if not any(any('birth_date' in j or 'death_date' in j for j in i[1]) for i in found): + continue + names = dict((k, v) for k, v in names.iteritems() if len(set(i['key'] for i in v)) > 1) + if not names: + continue + author_replace = {} + for name, authors in names.items(): + seen = set() +# print 'birth:', [a['birth_date'].strip('.') for a in authors if 'birth_date' in a] +# print 'death:', [a['death_date'].strip('.') for a in authors if 'death_date' in a] + with_dates = None + no_dates = [] + for a in authors: + if a['key'] in seen: + continue + seen.add(a['key']) + if 'birth_date' in a or 'death_date' in a: + if with_dates: + with_dates = None + break + with_dates = a['key'] + continue + no_dates.append(a['key']) + if with_dates and no_dates: + for i in no_dates: + assert i not in author_replace + author_replace[i] = with_dates + if not author_replace: + continue + print(isbn, author_replace) + for key, authors in found: + replace = [a['key'] for a in authors if a['key'] in author_replace] + if len(replace) == 0: + continue +# print len(replace), key, [a['key'] for a in authors] + new_authors = [] + this = {} + for a in authors: + akey = a['key'] + if akey in author_replace: + this[akey] = author_replace[akey] + akey = author_replace[akey] + if akey not in new_authors: + new_authors.append(akey) + q = { + 'key': key, + 'authors': { 'connect': 'update_list', 'value': new_authors } + } + print((key, this), file=out) +# for k in author_replace.keys(): +# print k, len(site.things({'type': '/type/edition', 'authors': k})) + +# for name, v in names.items(): +# print name +# for edition, author in v: +# print author, site.things({'type': '/type/edition', 'authors': author}) +# print +out.close() diff --git a/ia-legacy-importer/dup/find.py b/ia-legacy-importer/dup/find.py new file mode 100644 index 00000000..8b227e86 --- /dev/null +++ b/ia-legacy-importer/dup/find.py @@ -0,0 +1,76 @@ +from __future__ import print_function +import web +import sys +import codecs +import os.path +from catalog.read_rc import read_rc +import psycopg2 +from catalog.infostore import get_site +from catalog.merge.merge_marc import attempt_merge, build_marc +import catalog.marc.fast_parse as fast_parse + +sys.stdout = codecs.getwriter('utf-8')(sys.stdout) + +# need to use multiple databases +# use psycopg2 to until open library is upgraded to web 3.0 + +rc = read_rc() +threshold = 875 + +conn = psycopg2.connect("dbname='%s' user='%s' 
host='%s' password='%s'" \ + % ('ol_merge', rc['user'], rc['host'], rc['pw'])); +cur1 = conn.cursor() +cur2 = conn.cursor() + +site = get_site() + +marc_path = '/2/pharos/marc/' + +def get_marc(loc): + try: + filename, p, l = loc.split(':') + except ValueError: + return None + if not os.path.exists(marc_path + filename): + return None + f = open(marc_path + filename) + f.seek(int(p)) + buf = f.read(int(l)) + f.close() + rec = fast_parse.read_edition(buf) + if rec: + return build_marc(rec) + +for line in open('dups'): + v, num = eval(line) + cur2.execute('select key from isbn where value=%(v)s', {'v':v}) + editions = [] + for i in cur2.fetchall(): + key = i[0] + t = site.withKey(key) + mc = site.versions({'key': key})[0].machine_comment + editions.append({'key': key, 'title': t.title, 'loc': mc}) + if len(editions) != 2: + continue + if any(not i['loc'] or i['loc'].startswith('amazon:') for i in editions): + continue + e1 = get_marc(editions[0]['loc']) + if not e1: + continue + e2 = get_marc(editions[1]['loc']) + if not e2: + continue + +# print v, [i['title'] for i in editions] +# print e1 +# print e2 + match = attempt_merge(e1, e2, threshold, debug=False) + if match: + print(tuple([v] + [i['key'] for i in editions])) + +sys.exit(0) +cur1.execute('select value, count(*) as num from isbn group by value having count(*) > 1') +for i in cur1.fetchall(): + print(i) + cur2.execute('select key from isbn where value=%(v)s', {'v':i[0]}) + print(cur2.fetchall()) diff --git a/ia-legacy-importer/edition_merge/find_dups.py b/ia-legacy-importer/edition_merge/find_dups.py new file mode 100644 index 00000000..e221f2f8 --- /dev/null +++ b/ia-legacy-importer/edition_merge/find_dups.py @@ -0,0 +1,40 @@ +#!/usr/bin/python + +from __future__ import print_function +from openlibrary.api import OpenLibrary +from subprocess import Popen, PIPE +import MySQLdb + +ia_db_host = 'dbmeta.us.archive.org' +ia_db_user = 'archive' +ia_db_pass = Popen(["/opt/.petabox/dbserver"], stdout=PIPE).communicate()[0] + +ol = OpenLibrary('http://openlibrary.org/') + +local_db = MySQLdb.connect(db='merge_editions') +local_cur = local_db.cursor() + +archive_db = MySQLdb.connect(host=ia_db_host, user=ia_db_user, \ + passwd=ia_db_pass, db='archive') +archive_cur = archive_db.cursor() + +fields = ['identifier', 'updated', 'collection'] +sql_fields = ', '.join(fields) + +archive_cur.execute("select " + sql_fields + \ + " from metadata" + \ + " where scanner is not null and mediatype='texts'" + \ + " and (not curatestate='dark' or curatestate is null)" + \ + " and collection is not null and boxid is not null and identifier not like 'zdanh_test%' and scandate is not null " + \ + " order by updated") + +for num, (ia, updated, collection) in enumerate(archive_cur.fetchall()): + if 'lending' not in collection and 'inlibrary' not in collection: + continue + q = {'type': '/type/edition', 'ocaid': ia} + editions = set(str(i) for i in ol.query(q)) + q = {'type': '/type/edition', 'source_records': 'ia:' + ia} + editions.update(str(i) for i in ol.query(q)) + if len(editions) > 1: + print((ia, list(editions))) + local_cur.execute('replace into merge (ia, editions) values (%s, %s)', [ia, ' '.join(editions)]) diff --git a/ia-legacy-importer/edition_merge/find_easy.py b/ia-legacy-importer/edition_merge/find_easy.py new file mode 100644 index 00000000..5cbe5989 --- /dev/null +++ b/ia-legacy-importer/edition_merge/find_easy.py @@ -0,0 +1,191 @@ +from __future__ import print_function +import MySQLdb +import datetime +import re +import sys 
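+# make the openlibrary package importable from a local source checkout
+# (the path below is machine-specific). This script recomputes
+# merge.unmerge_count, the number of fields that cannot be combined
+# automatically for each IA item, so that run_merge.py can later pick up
+# the rows whose count reaches zero without manual intervention.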
+sys.path.append('/1/src/openlibrary') +from openlibrary.api import OpenLibrary, Reference +from collections import defaultdict + +re_edition_key = re.compile('^/books/OL(\d+)M$') +re_nonword = re.compile(r'\W', re.U) +re_edition = re.compile(' ed edition$') + +ol = OpenLibrary('http://openlibrary.org/') + +conn = MySQLdb.connect(db='merge_editions') +cur = conn.cursor() + +skip = 'guineapigscomple00elwa' +skip = None +total = 5601 +cur.execute("select ia, editions, done, unmerge_count from merge where unmerge_count != 0") # and ia='hantayo00hillrich'") +unmerge_field_counts = defaultdict(int) +num = 0 +for ia, ekeys, done, unmerge_count in cur.fetchall(): +# if unmerge_count == 0: +# continue + num += 1 + if num % 100 == 0: + print('%d/%d %.2f%%' % (num, total, ((float(num) * 100) / total)), ia) + if skip: + if skip == ia: + skip = None + continue + ekeys = ['/books/OL%dM' % x for x in sorted(int(re_edition_key.match(ekey).group(1)) for ekey in ekeys.split(' '))] + min_ekey = ekeys[0] + + if len(ekeys) > 3: + print(ia, ekeys) + editions = [ol.get(ekey) for ekey in ekeys] + all_keys = set() + for e in editions: + for k in 'classifications', 'identifiers', 'table_of_contents': + if k in e and not e[k]: + del e[k] + for e in editions: + all_keys.update(e.keys()) + for k in 'latest_revision', 'revision', 'created', 'last_modified', 'key', 'type', 'genres': + if k in all_keys: + all_keys.remove(k) + + for k in all_keys.copy(): + if k.startswith('subject'): + all_keys.remove(k) + + for e in editions: # resolve redirects + if 'authors' not in e: + continue + new_authors = [] + for akey in e['authors']: + a = ol.get(akey) + if a['type'] == Reference('/type/redirect'): + akey = Reference(a['location']) + else: + assert a['type'] == Reference('/type/author') + new_authors.append(akey) + e['authors'] = new_authors + + merged = {} + k = 'publish_date' + publish_dates = set(e[k] for e in editions if k in e and len(e[k]) != 4) + + k = 'pagination' + all_pagination = set(e[k].strip(':.') for e in editions if e.get(k)) + + one_item_lists = {} + for k in 'lc_classifications', 'publishers', 'contributions', 'series', 'authors': + one_item_lists[k] = set(e[k][0].strip('.') for e in editions if e.get(k) and len(set(e[k])) == 1) + + for k in 'source_records', 'ia_box_id': + merged[k] = [] + for e in editions: + for sr in e.get(k, []): + if sr not in merged[k]: + merged[k].append(sr) + + for k in ['other_titles', 'isbn_10', 'series', 'oclc_numbers', 'publishers']: + if k not in all_keys: + continue + merged[k] = [] + for e in editions: + for sr in e.get(k, []): + if sr not in merged[k]: + merged[k].append(sr) + + k = 'ocaid' + for e in editions: + if e.get(k) and 'ia:' + e[k] not in merged['source_records']: + merged['source_records'].append(e[k]) + + k = 'identifiers' + if k in all_keys: + merged[k] = {} + for e in editions: + if k not in e: + continue + for a, b in e[k].items(): + for c in b: + if c in merged[k].setdefault(a, []): + continue + merged[k][a].append(c) + + any_publish_country = False + k = 'publish_country' + if k in all_keys: + for e in editions: + if e.get(k) and not e[k].strip().startswith('xx'): + any_publish_country = True + + skip_fields = set(['source_records', 'ia_box_id', 'identifiers', 'ocaid', 'other_titles', 'series', 'isbn_10']) + for k in all_keys: + if k in skip_fields: + continue + + uniq = defaultdict(list) + for num, e in enumerate(editions): + if e.get(k): + if k == 'publish_date' and len(e[k]) == 4 and e[k].isdigit and any(e[k] in pd for pd in publish_dates): + continue + if 
k == 'pagination' and any(len(i) > len(e[k].strip('.:')) and e[k].strip('.:') in i for i in all_pagination): + continue + if k in one_item_lists and len(set(e.get(k, []))) == 1 and any(len(i) > len(e[k][0].strip('.')) and e[k][0].strip('.') in i for i in one_item_lists[k]): + continue + if k == 'publish_country' and any_publish_country and e.get(k, '').strip().startswith('xx'): + continue + if k == 'edition_name' and e[k].endswith(' ed edition'): + e[k] = e[k][:-len(' edition')] + uniq[re_nonword.sub('', repr(e[k]).lower())].append(num) + + if len(uniq) == 1: + merged[k] = uniq.keys()[0] + merged[k] = editions[uniq.values()[0][0]][k] + continue + + if k == 'covers': + assert all(isinstance(e[k], list) for e in editions if k in e) + covers = set() + for e in editions: + if k in e: + covers.update(c for c in e[k] if c != -1) + merged['covers'] = sorted(covers) + continue + + if k == 'notes': + merged['notes'] = '' + for e in editions: + if e.get('notes'): + merged['notes'] += e['notes'] + '\n' + continue + + if k == 'ocaid': + for e in editions: + if e.get('ocaid'): + if e['ocaid'].endswith('goog'): + print(e['key'], e['ocaid'], ia) + merged['ocaid'] = e['ocaid'] + break + assert merged['ocaid'] + continue + + if k =='authors': + min_author = set(min((e.get('authors', []) for e in editions), key=len)) + if all(min_author <= set(e.get('authors', [])) for e in editions): + merged[k] = max((e.get('authors', []) for e in editions), key=len) + continue + merged[k] = None + unmerged = len([1 for v in merged.values() if v is None]) + if unmerged == 1: + assert len([k for k, v in merged.items() if v is None]) == 1 + for k, v in merged.items(): + if v is None: + if k == 'series': + print(ia, [e[k] for e in editions if e.get(k)]) + unmerge_field_counts[k] += 1 + #print 'unmerged count', unmerged, ia, ekeys + cur.execute('update merge set unmerge_count=%s where ia=%s', [unmerged, ia]) + +print(dict(unmerge_field_counts)) +print(unmerge_field_counts.items()) +for k,v in sorted(unmerge_field_counts.items(), key=lambda i:i[1]): + print('%30s: %d' % (k, v)) diff --git a/ia-legacy-importer/edition_merge/merge.py b/ia-legacy-importer/edition_merge/merge.py new file mode 100644 index 00000000..688b1130 --- /dev/null +++ b/ia-legacy-importer/edition_merge/merge.py @@ -0,0 +1,247 @@ +#!/usr/bin/python + +import MySQLdb +import datetime +import re +import sys +sys.path.append('/1/src/openlibrary') +from openlibrary.api import OpenLibrary, Reference +from flask import Flask, render_template, request, flash, redirect, url_for, g +from collections import defaultdict +app = Flask(__name__) + +re_edition_key = re.compile('^/books/OL(\d+)M$') + +ol = OpenLibrary('http://openlibrary.org/') +ol.login('EdwardBot', 'As1Wae9b') + +@app.before_request +def before_request(): + g.db = MySQLdb.connect(db='merge_editions') + +@app.after_request +def after_request(r): + g.db.close() + return r + +re_nonword = re.compile(r'\W', re.U) + +rows = 200 + +app.secret_key = 'rt9%s#)5kid$!u*5_@*$f2f_%jq++nl3@d%=7f%v4&78^m4p7c' + +@app.route("/") +def index(): + page = int(request.args.get('page', 1)) + cur = g.db.cursor() + cur.execute('select count(*) from merge where done is null') + total = cur.fetchone()[0] + cur.execute('select count(*) from merge where done is null and unmerge_count = 0') + easy = cur.fetchone()[0] + cur.execute('select ia, editions, unmerge_count from merge where done is null limit %s offset %s', [rows, (page-1) * rows]) + reply = cur.fetchall() + return render_template('index.html', merge_list=reply, total=total, 
rows=rows, page=page, easy=easy ) + +def run_merge(ia): + cur = g.db.cursor() + cur.execute('select editions from merge where ia=%s', ia) + [ekeys] = cur.fetchone() + ekeys = ['/books/OL%dM' % x for x in sorted(int(re_edition_key.match(ekey).group(1)) for ekey in ekeys.split(' '))] + min_ekey = ekeys[0] + + editions = [ol.get(ekey) for ekey in ekeys] + editions_by_key = dict((e['key'][7:], e) for e in editions) + merged = build_merged(editions) + + missing = [] + for k, v in merged.items(): + if v is not None: + continue + use_ekey = request.form.get(k) + if use_ekey is None: + missing.append(k) + continue + merged[k] = editions_by_key[use_ekey][k] + if missing: + flash('please select: ' + ', '.join(missing)) + return redirect(url_for('merge', ia=ia)) + + master = ol.get(min_ekey) + for k, v in merged.items(): + master[k] = v + + updates = [] + updates.append(master) + for ekey in ekeys: + if ekey == min_ekey: + continue + ol_redirect = { + 'type': Reference('/type/redirect'), + 'location': min_ekey, + 'key': ekey, + } + updates.append(ol_redirect) + #print len(updates), min_ekey + try: + ol.save_many(updates, 'merge lending editions') + except: + #for i in updates: + # print i + raise + cur.execute('update merge set done=now() where ia=%s', [ia]) + + flash(ia + ' merged') + return redirect(url_for('index')) + +def build_merged(editions): + all_keys = set() + + for e in editions: + for k in 'classifications', 'identifiers': + if k in e and not e[k]: + del e[k] + + for e in editions: + all_keys.update(e.keys()) + + for k in 'latest_revision', 'revision', 'created', 'last_modified', 'key', 'type', 'genres': + if k in all_keys: + all_keys.remove(k) + + for k in all_keys.copy(): + if k.startswith('subject'): + all_keys.remove(k) + + merged = {} + k = 'publish_date' + publish_dates = set(e[k] for e in editions if k in e and len(e[k]) != 4) + + k = 'pagination' + all_pagination = set(e[k] for e in editions if e.get(k)) + + one_item_lists = {} + for k in 'lc_classifications', 'publishers', 'contributions', 'series': + one_item_lists[k] = set(e[k][0].strip('.') for e in editions if e.get(k) and len(set(e[k])) == 1) + + for k in 'source_records', 'ia_box_id': + merged[k] = [] + for e in editions: + for sr in e.get(k, []): + if sr not in merged[k]: + merged[k].append(sr) + + for k in ['other_titles', 'isbn_10', 'series']: + if k not in all_keys: + continue + merged[k] = [] + for e in editions: + for sr in e.get(k, []): + if sr not in merged[k]: + merged[k].append(sr) + + + k = 'ocaid' + for e in editions: + if e.get(k) and 'ia:' + e[k] not in merged['source_records']: + merged['source_records'].append(e[k]) + + k = 'identifiers' + if k in all_keys: + merged[k] = {} + for e in editions: + if k not in e: + continue + for a, b in e[k].items(): + for c in b: + if c in merged[k].setdefault(a, []): + continue + merged[k][a].append(c) + + any_publish_country = False + k = 'publish_country' + if k in all_keys: + for e in editions: + if e.get(k) and not e[k].strip().startswith('xx'): + any_publish_country = True + + for k in all_keys: + if k in ('source_records', 'ia_box_id', 'identifiers'): + continue + + uniq = defaultdict(list) + for num, e in enumerate(editions): + if e.get(k): + if k == 'publish_date' and len(e[k]) == 4 and e[k].isdigit and any(e[k] in pd for pd in publish_dates): + continue + if k == 'pagination' and any(len(i) > len(e[k]) and e[k] in i for i in all_pagination): + continue + if k in one_item_lists and len(set(e.get(k, []))) == 1 and any(len(i) > len(e[k][0].strip('.')) and 
e[k][0].strip('.') in i for i in one_item_lists[k]): + continue + if k == 'publish_country' and any_publish_country and e.get(k, '').strip().startswith('xx'): + continue + if k == 'edition_name' and e[k].endswith(' ed edition'): + e[k] = e[k][:-len(' edition')] + uniq[re_nonword.sub('', repr(e[k]).lower())].append(num) + + if len(uniq) == 1: + #merged[k] = uniq.keys()[0] + merged[k] = editions[uniq.values()[0][0]][k] + continue + + if k == 'covers': + assert all(isinstance(e[k], list) for e in editions if k in e) + covers = set() + for e in editions: + if k in e: + covers.update(c for c in e[k] if c != -1) + merged['covers'] = sorted(covers) + continue + + if k == 'notes': + merged['notes'] = '' + for e in editions: + if e.get('notes'): + merged['notes'] += e['notes'] + '\n' + continue + + if k == 'ocaid': + for e in editions: + if e.get('ocaid'): + #assert not e['ocaid'].endswith('goog') + merged['ocaid'] = e['ocaid'] + break + assert merged['ocaid'] + continue + merged[k] = None + + return merged + +@app.route("/merge/", methods=['GET', 'POST']) +def merge(ia): + if request.method == 'POST': + return run_merge(ia) + + cur = g.db.cursor() + cur.execute('select ia, editions, done from merge where ia = %s', [ia]) + ia, ekeys, done = cur.fetchone() + ekeys = ['/books/OL%dM' % x for x in sorted(int(re_edition_key.match(ekey).group(1)) for ekey in ekeys.split(' '))] + min_ekey = ekeys[0] + + editions = [ol.get(ekey) for ekey in ekeys] + + merged = build_merged(editions) + all_keys = merged.keys() + + works = [] + + return render_template('merge.html', + ia=ia, + editions=editions, + keys=sorted(all_keys), + merged = merged, + ekeys=ekeys, + works=works, + master=min_ekey) + +if __name__ == "__main__": + app.run(host='0.0.0.0', debug=True) diff --git a/ia-legacy-importer/edition_merge/merge_works.py b/ia-legacy-importer/edition_merge/merge_works.py new file mode 100644 index 00000000..4b591e71 --- /dev/null +++ b/ia-legacy-importer/edition_merge/merge_works.py @@ -0,0 +1,149 @@ +from __future__ import print_function +import MySQLdb +import datetime +import re +import sys +from openlibrary.catalog.utils import cmp +sys.path.append('/1/src/openlibrary') +from openlibrary.api import OpenLibrary, Reference + +import six + + +conn = MySQLdb.connect(db='merge_editions') +cur = conn.cursor() + +re_edition_key = re.compile('^/books/OL(\d+)M$') +re_work_key = re.compile('^/works/OL(\d+)W$') +ol = OpenLibrary('http://openlibrary.org/') +ol.login('EdwardBot', 'As1Wae9b') + +re_iso_date = re.compile('^(\d{4})-\d\d-\d\d$') +re_end_year = re.compile('(\d{4})$') + +def get_publish_year(d): + if not d: + return + m = re_iso_date.match(d) + if m: + return int(m.group(1)) + m = re_end_year.match(d) + if m: + return int(m.group(1)) + +{'lc_classifications': ['PZ7.H558 Ru'], 'dewey_number': ['[E]']} +def merge_works(works): + master = works.pop(0) + master_first_publish_year = get_publish_year(master.get('first_publish_date')) + subtitles = sorted((w['subtitle'] for w in works if w.get('subtitle')), key=lambda s: len(s)) + if subtitles and len(subtitles[-1]) > len(master.get('subtitle', '')): + master['subtitle'] = subtitles[-1] + updates = [] + for w in works: + wkey = w.pop('key') + q = {'type': '/type/edition', 'works': wkey} + for ekey in ol.query(q): + e = ol.get(ekey) + assert len(e['works']) == 1 and e['works'][0] == wkey + e['works'] = [Reference(master['key'])] + updates.append(e) + assert w['type'] != Reference('/type/redirect') + updates.append({ + 'key': wkey, + 'type': Reference('/type/redirect'), + 
'location': master['key'], + }) + for f in 'covers', 'subjects', 'subject_places', 'subject_people', 'subject_times', 'lc_classifications', 'dewey_number': + if not w.get(f): + continue + assert not isinstance(w[f], six.string_types) + for i in w[f]: + if i not in master.setdefault(f, []): + master[f].append(i) + + if w.get('first_sentence') and not master.get('first_sentence'): + master['first_sentence'] = w['first_sentence'] + if w.get('first_publish_date'): + if not master.get('first_publish_date'): + master['first_publish_date'] = w['first_publish_date'] + else: + publish_year = get_publish_year(w['first_publish_date']) + if publish_year < master_first_publish_year: + master['first_publish_date'] = w['first_publish_date'] + master_first_publish_year = publish_year + + for excerpt in w.get('exceprts', []): + master.setdefault('exceprts', []).append(excerpt) + + for f in 'title', 'subtitle', 'created', 'last_modified', 'latest_revision', 'revision', 'number_of_editions', 'type', 'first_sentence', 'authors', 'first_publish_date', 'excerpts', 'covers', 'subjects', 'subject_places', 'subject_people', 'subject_times', 'lc_classifications', 'dewey_number': + try: + del w[f] + except KeyError: + pass + + print(w) + assert not w + updates.append(master) + print(len(updates), [(doc['key'], doc['type']) for doc in updates]) + # update master + # update editions to point at master + # replace works with redirects + print(ol.save_many(updates, 'merge works')) + +skip = 'seventeenagainst00voig' +skip = 'inlineskatingbas00sava' +skip = 'elephantatwaldor00mira' +skip = 'sybasesqlserverp00paul' +skip = 'karmadunl00dunl' +skip = 'norbychronicles00asim' +skip = 'elizabethbarrett00fors' +skip = None +updates = [] +cur.execute('select ia, editions, done, unmerge_count from merge') +for ia, ekeys, done, unmerge_count in cur.fetchall(): + if skip: + if ia == skip: + skip = None + else: + continue + ekeys = ['/books/OL%dM' % x for x in sorted(int(re_edition_key.match(ekey).group(1)) for ekey in ekeys.split(' '))] + editions = [ol.get(ekey) for ekey in ekeys] + + if any('authors' not in e or 'works' not in e for e in editions): + continue + author0 = editions[0]['authors'][0] + work0 = editions[0]['works'][0] + try: + if not all(author0 == e['authors'][0] for e in editions[1:]): + continue + except: + print('editions:', [e['key'] for e in editions]) + raise + if all(work0 == e['works'][0] for e in editions[1:]): + continue + wkeys = [] + for e in editions: + for wkey in e['works']: + if wkey not in wkeys: + wkeys.append(wkey) + + works = [] + for wkey in wkeys: + w = ol.get(wkey) + q = {'type': '/type/edition', 'works': wkey, 'limit': 1000} + w['number_of_editions'] = len(ol.query(q)) + works.append(w) + title0 = works[0]['title'].lower() + if not all(w['title'].lower() == title0 for w in works[1:]): + continue + print(ia, ekeys) + print(' works:', wkeys) + def work_key_int(wkey): + return int(re_work_key.match(wkey).group(1)) + works = sorted(works, cmp=lambda a,b:-cmp(a['number_of_editions'],b['number_of_editions']) or cmp(work_key_int(a['key']), work_key_int(b['key']))) + print(' titles:', [(w['title'], w['number_of_editions']) for w in works]) + print(author0) + #print [w['authors'][0]['author'] for w in works] + assert all(author0 == w['authors'][0]['author'] for w in works) + merge_works(works) + print() diff --git a/ia-legacy-importer/edition_merge/run_merge.py b/ia-legacy-importer/edition_merge/run_merge.py new file mode 100644 index 00000000..5110ec45 --- /dev/null +++ 
b/ia-legacy-importer/edition_merge/run_merge.py @@ -0,0 +1,185 @@ +from __future__ import print_function +import MySQLdb +import datetime +import re +import sys +from openlibrary.api import OpenLibrary, Reference +from collections import defaultdict + +import six + + +re_edition_key = re.compile('^/books/OL(\d+)M$') +re_nonword = re.compile(r'\W', re.U) + +conn = MySQLdb.connect(db='merge_editions') +cur = conn.cursor() +cur2 = conn.cursor() + +ol = OpenLibrary('http://openlibrary.org/') +ol.login('EdwardBot', 'As1Wae9b') + +cur.execute('select ia, editions, done from merge where done is null and unmerge_count=0') +for ia, ekeys, done in cur.fetchall(): + updates = [] + ekeys = ['/books/OL%dM' % x for x in sorted(int(re_edition_key.match(ekey).group(1)) for ekey in ekeys.split(' '))] + print((ia, ekeys)) + min_ekey = ekeys[0] + editions = [ol.get(ekey) for ekey in ekeys] + master = editions[0] + + for e in editions: + for k in 'classifications', 'identifiers', 'table_of_contents': + if k in e and not e[k]: + del e[k] + + all_keys = set() + for e in editions: + all_keys.update(k for k, v in e.items() if v) + for k in 'latest_revision', 'revision', 'created', 'last_modified', 'key', 'type', 'genres': + if k in all_keys: + all_keys.remove(k) + + for k in all_keys.copy(): + if k.startswith('subject'): + all_keys.remove(k) + + for e in editions: # resolve redirects + if 'authors' not in e: + continue + new_authors = [] + for akey in e['authors']: + a = ol.get(akey) + if a['type'] == Reference('/type/redirect'): + akey = Reference(a['location']) + else: + assert a['type'] == Reference('/type/author') + new_authors.append(akey) + e['authors'] = new_authors + + k = 'publish_date' + publish_dates = set(e[k] for e in editions if k in e and len(e[k]) != 4) + + k = 'pagination' + all_pagination = set(e[k].strip(':.') for e in editions if e.get(k)) + + one_item_lists = {} + for k in 'lc_classifications', 'publishers', 'contributions', 'series': + one_item_lists[k] = set(e[k][0].strip('.') for e in editions if e.get(k) and len(set(e[k])) == 1) + + + master.setdefault('source_records', []) + for k in 'source_records', 'ia_box_id', 'other_titles','isbn_10','series': + for e in editions[1:]: + if not e.get(k): + continue + for i in e[k]: + if i not in master.setdefault(k, []): + master[k].append(i) + + k = 'ocaid' + for e in editions[1:]: + if e.get(k) and 'ia:' + e[k] not in master['source_records']: + master['source_records'].append(e[k]) + + k = 'identifiers' + if any(k in e for e in editions): + master.setdefault(k, {}) + for e in editions[1:]: + if k not in e: + continue + for a, b in e[k].items(): + for c in b: + if c in master[k].setdefault(a, []): + continue + master[k][a].append(c) + + any_publish_country = False + k = 'publish_country' + if k in all_keys: + for e in editions: + if e.get(k) and not e[k].strip().startswith('xx'): + any_publish_country = True + + no_merge = False + skip_fields = set(['source_records', 'ia_box_id', 'identifiers', 'ocaid', 'other_titles', 'series', 'isbn_10']) + for k in all_keys: + if k in skip_fields: + continue + + uniq = defaultdict(list) + for num, e in enumerate(editions): + if e.get(k): + if k == 'publish_date' and len(e[k]) == 4 and e[k].isdigit and any(e[k] in pd for pd in publish_dates): + continue + if k == 'pagination' and any(len(i) > len(e[k].strip('.:')) and e[k].strip('.:') in i for i in all_pagination): + continue + if k in one_item_lists and len(set(e.get(k, []))) == 1 and any(len(i) > len(e[k][0].strip('.')) and e[k][0].strip('.') in i for i in 
one_item_lists[k]): + continue + if k == 'publish_country' and any_publish_country and e.get(k, '').strip().startswith('xx'): + continue + if k == 'edition_name' and e[k].endswith(' ed edition'): + e[k] = e[k][:-len(' edition')] + uniq[re_nonword.sub('', repr(e[k]).lower())].append(num) + + if len(uniq) == 0: + continue + if len(uniq) == 1: + master[k] = editions[uniq.values()[0][0]][k] + continue + + if k == 'covers': + assert all(isinstance(e[k], list) for e in editions if k in e) + covers = set() + for e in editions: + if k in e: + covers.update(c for c in e[k] if c != -1) + master['covers'] = sorted(covers) + continue + + if k == 'notes': + master['notes'] = '' + for e in editions: + if e.get('notes'): + master['notes'] += e['notes'] + '\n' + continue + + if k == 'ocaid': + for e in editions: + if e.get('ocaid'): + if e['ocaid'].endswith('goog'): + print(e['key'], e['ocaid'], ia) + master['ocaid'] = e['ocaid'] + break + assert master['ocaid'] + continue + + if k == 'authors': + min_author = set(min((e.get('authors', []) for e in editions), key=len)) + if all(min_author <= set(e.get('authors', [])) for e in editions): + master[k] = max((e.get('authors', []) for e in editions), key=len) + continue + + print('unmerged field:', k) + print([e.get(k) for e in editions]) + no_merge = True + if no_merge: + continue + if 'location' in master and isinstance(master['location'], six.string_types) and master['location'].startswith('/books/'): + del master['location'] + updates.append(master) + for e in editions[1:]: + redirect = { + 'type': Reference('/type/redirect'), + 'location': min_ekey, + 'key': e['key'], + } + updates.append(redirect) + print(len(updates), min_ekey) + try: + print(ol.save_many(updates, 'merge lending editions')) + except: + for i in updates: + print(i) + raise + cur2.execute('update merge set done=now() where ia=%s', [ia]) diff --git a/ia-legacy-importer/edition_merge/schema.sql b/ia-legacy-importer/edition_merge/schema.sql new file mode 100644 index 00000000..080effaf --- /dev/null +++ b/ia-legacy-importer/edition_merge/schema.sql @@ -0,0 +1,5 @@ +create table merge ( + ia varchar(255) not null primary key, + editions varchar(255) not null, + done datetime +); diff --git a/ia-legacy-importer/edition_merge/templates/index.html b/ia-legacy-importer/edition_merge/templates/index.html new file mode 100644 index 00000000..65f06247 --- /dev/null +++ b/ia-legacy-importer/edition_merge/templates/index.html @@ -0,0 +1,61 @@ + + +Merge duplicate editions + + + +
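+<!-- index page for the Flask tool in merge.py: lists pending rows from the
+     local "merge" table; rows with unmerge_count == 0 get a direct "merge"
+     link, the others only display their count of unmerged fields -->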

    Merge duplicate editions

    + +{% with messages = get_flashed_messages() %} + {% if messages %} +
      + {% for message in messages %} +
{{ message }}
+ {% endfor %} +
    + {% endif %} +{% endwith %} + +{% macro pager() %} +Pages: +{% for i in range((total / rows)+1) %} +{% if i + 1 == page %} +{{ page }} +{% else %} +
    {{ i + 1}} +{% endif %} +{% endfor %} +

    +{% endmacro %} + +{{ pager() }} + +{{ total }} items need to be merged ({{ easy }} easy)

    + + +{% for ia, editions, unmerge_count in merge_list %} + + + + +{% if unmerge_count == 0 %} + + +{% endfor %} +
    {{ ia }} +{% for ekey in editions.split(' ') %} +{{ekey}} +{% endfor %} +merge +{% else %} + +{% endif %} +{{ unmerge_count }} +
    + +{{ pager() }} + + + diff --git a/ia-legacy-importer/edition_merge/templates/merge.html b/ia-legacy-importer/edition_merge/templates/merge.html new file mode 100644 index 00000000..497418d6 --- /dev/null +++ b/ia-legacy-importer/edition_merge/templates/merge.html @@ -0,0 +1,88 @@ + + +Merge {{ia}} + + + + +
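+<!-- per-item page rendered by merge.py: one column per edition plus the
+     automatically merged value for each field; any field the code could not
+     resolve has to be picked in the form, after which run_merge() saves the
+     master record and turns the other editions into redirects to it -->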

    Merge {{ia}}

    + +back to index

    + +{% with messages = get_flashed_messages() %} + {% if messages %} +

      + {% for message in messages %} +
{{ message }}
+ {% endfor %} +
    + {% endif %} +{% endwith %} + + + +Merging editions: {{ ekeys }} into {{ master }}

    + +

    + + +{% for ekey in ekeys %} + +{% endfor %} + + +{% for k in keys %} + + +{% for e in editions %} +{% set ekey = e['key'][7:] %} + +{% endfor %} +{% if merged.get(k) %} + +{% else %} + +{% endif %} + +{% endfor %} + + + + +
    {{ ekey }}merged
    {{ k }} +{% if k == 'notes' and e.get(k) %} +{% for line in e[k].splitlines() %} +{{ line }}
    +{% endfor %} +{% elif k == 'authors' and e.get(k) %} +{% for akey in e[k] %} + {{akey}} +{% endfor %} + +{% elif not merged.get(k) and e.get(k) %} + {{ e.get(k) }} +{% else %} +{{ e.get(k) }} +{% endif %} +
    +{% if k == 'notes' %} +{% for line in merged[k].splitlines() %} +{{ line }}
    +{% endfor %} +{% else %} +{{ merged[k] }} +{% endif %} +
    + + +
    + + + + + diff --git a/ia-legacy-importer/edition_merge/templates/web_merge.html b/ia-legacy-importer/edition_merge/templates/web_merge.html new file mode 100644 index 00000000..97d78109 --- /dev/null +++ b/ia-legacy-importer/edition_merge/templates/web_merge.html @@ -0,0 +1,58 @@ + + +Merge {{ia}} + + + +
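+<!-- apparently an alternative version of the comparison page: the same
+     field-by-field table of edition values next to the merged value,
+     followed by a pretty-printed dump of the related works -->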

    Merge {{ia}}

    + +Merging editions: {{ ekeys }} into {{ master }}

    + +merge listsskip

    + + + +{% for ekey in ekeys %} + + +{% endfor %} + + +{% for k in keys %} + + +{% for e in editions %} + +{% endfor %} +{% if merged.get(k) %} + +{% else %} + +{% endif %} + +{% endfor %} +
    {{ ekey }}mergemerged
    {{ k }} +{% if k == 'notes' and e.get(k) %} +{% for line in e[k].splitlines() %} +{{ line }}
    +{% endfor %} +{% else %} +{{ e.get(k) }} +{% endif %} +
    +{% if k == 'notes' %} +{% for line in merged[k].splitlines() %} +{{ line }}
    +{% endfor %} +{% else %} +{{ merged[k] }} +{% endif %} +
    + +

    Works

    +
    {{ works | pprint }}
    + + + diff --git a/ia-legacy-importer/get_ia.py b/ia-legacy-importer/get_ia.py new file mode 100644 index 00000000..4be5926e --- /dev/null +++ b/ia-legacy-importer/get_ia.py @@ -0,0 +1,258 @@ +from __future__ import print_function + +import os.path +import socket +import traceback +import xml.parsers.expat + +from infogami import config +from lxml import etree +from six.moves import urllib +from time import sleep + +from openlibrary.catalog.marc.marc_binary import MarcBinary +from openlibrary.catalog.marc.marc_xml import MarcXml +from openlibrary.catalog.marc.parse import read_edition +from openlibrary.catalog.marc.fast_parse import read_file as fast_read_file # Deprecated import +from openlibrary.core import ia + + +IA_BASE_URL = config.get('ia_base_url') +IA_DOWNLOAD_URL = '%s/download/' % IA_BASE_URL +MAX_MARC_LENGTH = 100000 + +class NoMARCXML(IOError): + # DEPRECATED, rely on MarcXml to raise exceptions + pass + +def urlopen_keep_trying(url): + for i in range(3): + try: + f = urllib.request.urlopen(url) + return f + except urllib.error.HTTPError as error: + if error.code in (403, 404, 416): + raise + except urllib.error.URLError: + pass + sleep(2) + +def bad_ia_xml(identifier): + # DEPRECATED + if identifier == 'revistadoinstit01paulgoog': + return False + # need to handle 404s: + # http://www.archive.org/details/index1858mary + loc = "{0}/{0}_marc.xml".format(identifier) + return ' + + + + Notification or update type code + + + + + Early notification + Use for a complete record issued earlier than approximately six months before publication. + + + + + Advance notification (confirmed) + Use for a complete record issued to confirm advance information approximately six months before publication; or for a complete record issued after that date and before information has been confirmed from the book-in-hand. + + + + + Notification confirmed from book-in-hand + Use for a complete record issued to confirm advance information using the book-in-hand at or just before actual publication date; or for a complete record issued at any later date. + + + + + Update (partial) + Intended to be used for an update to a part of the record which is sent without re-issuing the complete record. In practise, however, ONIX updating is invariably by complete record replacement using code 03, and code 04 is not used. + + + + + Delete + Use when sending an instruction to delete a record which was previously issued. Note that a delete instruction should NOT be used when a product is cancelled, put out of print, or otherwise withdrawn from sale: this should be handled as a change of availability status, leaving the receiver to decide whether to retain or delete the record. A delete instruction is only used when there is a particular reason to withdraw a record completely, eg because it was issued in error. 
+ + + + + Notice of sale + Notice of sale of a product, from one publisher to another: sent by the publisher disposing of the product + + + + + Notice of acquisition + Notice of acquisition of a product, by one publisher from another: sent by the acquiring publisher + + + + + + + Reason for deletion code + + + + + + Record source type code + + + + + Unspecified + + + + + + Publisher + + + + + + Publisher's distributor + Use to designate a distributor providing warehousing and fulfilment for a publisher or for a publisher’s sales agent, as distinct from a wholesaler + + + + + Wholesaler + + + + + + Bibliographic agency + + + + + + Library bookseller + + + + + + Publisher’s sales agent + Use for a publisher’s sales agent responsible for marketing the publisher’s products within a territory, as opposed to a publisher’s distributor who fulfils orders but does not market + + + + + + + Product identifier type code + + + + + Proprietary + For example, a publisher’s or wholesaler’s product number. + + + + + ISBN-10 + International Standard Book Number, pre-2007, unhyphenated (10 characters) + + + + + EAN.UCC-13 + EAN-UCC article number (13 digits) + + + + + UPC + UPC product number (12 digits) + + + + + ISMN + International Standard Music Number (10 digits) + + + + + DOI + Digital Object Identifier (variable length and character set) + + + + + LCCN + Library of Congress Control Number (12 characters, alphanumeric) + + + + + GTIN-14 + EAN-UCC Global Trade Item Number (14 digits) + + + + + ISBN-13 + International Standard Book Number, from 2007, unhyphenated (13 digits) + + + + + + + Barcode indicator + + + + + Not barcoded + + + + + + Barcoded, scheme unspecified + + + + + + EAN13 + Position unspecified + + + + + EAN13+5 + Position unspecified + + + + + UPC12 + Type and position unspecified. DEPRECATED: if possible, use more specific values below. + + + + + UPC12+5 + Type and position unspecified. DEPRECATED: if possible, use more specific values below. 
+ + + + + UPC12 (item-specific) + AKA item/price: position unspecified + + + + + UPC12+5 (item-specific) + AKA item/price: position unspecified + + + + + UPC12 (price-point) + AKA price/item: position unspecified + + + + + UPC12+5 (price-point) + AKA price/item: position unspecified + + + + + EAN13 on cover 4 + ‘Cover 4’ is defined as the back cover of a book + + + + + EAN13+5 on cover 4 + ‘Cover 4’ is defined as the back cover of a book + + + + + UPC12 (item-specific) on cover 4 + AKA item/price; 'cover 4' is defined as the back cover of a book + + + + + UPC12+5 (item-specific) on cover 4 + AKA item/price; 'cover 4' is defined as the back cover of a book + + + + + UPC12 (price-point) on cover 4 + AKA price/item; 'cover 4' is defined as the back cover of a book + + + + + UPC12+5 (price-point) on cover 4 + AKA price/item; 'cover 4' is defined as the back cover of a book + + + + + EAN13 on cover 3 + ‘Cover 3’ is defined as the inside back cover of a book + + + + + EAN13+5 on cover 3 + ‘Cover 3’ is defined as the inside back cover of a book + + + + + UPC12 (item-specific) on cover 3 + AKA item/price; 'cover 3' is defined as the inside back cover of a book + + + + + UPC12+5 (item-specific) on cover 3 + AKA item/price; 'cover 3' is defined as the inside back cover of a book + + + + + UPC12 (price-point) on cover 3 + AKA price/item; 'cover 3' is defined as the inside back cover of a book + + + + + UPC12+5 (price-point) on cover 3 + AKA price/item; 'cover 3' is defined as the inside back cover of a book + + + + + EAN13 on cover 2 + ‘Cover 2’ is defined as the inside front cover of a book + + + + + EAN13+5 on cover 2 + ‘Cover 2’ is defined as the inside front cover of a book + + + + + UPC12 (item-specific) on cover 2 + AKA item/price; 'cover 2' is defined as the inside front cover of a book + + + + + UPC12+5 (item-specific) on cover 2 + AKA item/price; 'cover 2' is defined as the inside front cover of a book + + + + + UPC12 (price-point) on cover 2 + AKA price/item; 'cover 2' is defined as the inside front cover of a book + + + + + UPC12+5 (price-point) on cover 2 + AKA price/item; 'cover 2' is defined as the inside front cover of a book + + + + + EAN13 on box + To be used only on boxed products + + + + + EAN13+5 on box + To be used only on boxed products + + + + + UPC12 (item-specific) on box + AKA item/price; to be used only on boxed products + + + + + UPC12+5 (item-specific) on box + AKA item/price; to be used only on boxed products + + + + + UPC12 (price-point) on box + AKA price/item; to be used only on boxed products + + + + + UPC12+5 (price-point) on box + AKA price/item; to be used only on boxed products + + + + + EAN13 on tag + To be used only on products fitted with hanging tags + + + + + EAN13+5 on tag + To be used only on products fitted with hanging tags + + + + + UPC12 (item-specific) on tag + AKA item/price; to be used only on products fitted with hanging tags + + + + + UPC12+5 (item-specific) on tag + AKA item/price; to be used only on products fitted with hanging tags + + + + + UPC12 (price-point) on tag + AKA price/item; to be used only on products fitted with hanging tags + + + + + UPC12+5 (price-point) on tag + AKA price/item; to be used only on products fitted with hanging tags + + + + + EAN13 on bottom + Not be used on books unless they are contained within outer packaging + + + + + EAN13+5 on bottom + Not be used on books unless they are contained within outer packaging + + + + + UPC12 (item-specific) on bottom + AKA item/price; not be used on books unless they are contained 
within outer packaging + + + + + UPC12+5 (item-specific) on bottom + AKA item/price; not be used on books unless they are contained within outer packaging + + + + + UPC12 (price-point) on bottom + AKA price/item; not be used on books unless they are contained within outer packaging + + + + + UPC12+5 (price-point) on bottom + AKA price/item; not be used on books unless they are contained within outer packaging + + + + + EAN13 on back + Not be used on books unless they are contained within outer packaging + + + + + EAN13+5 on back + Not be used on books unless they are contained within outer packaging + + + + + UPC12 (item-specific) on back + AKA item/price; not be used on books unless they are contained within outer packaging + + + + + UPC12+5 (item-specific) on back + AKA item/price; not be used on books unless they are contained within outer packaging + + + + + UPC12 (price-point) on back + AKA price/item; not be used on books unless they are contained within outer packaging + + + + + UPC12+5 (price-point) on back + AKA price/item; not be used on books unless they are contained within outer packaging + + + + + EAN13 on outer sleeve/back + To be used only on products packaged in outer sleeves + + + + + EAN13+5 on outer sleeve/back + To be used only on products packaged in outer sleeves + + + + + UPC12 (item-specific) on outer sleeve/back + AKA item/price; to be used only on products packaged in outer sleeves + + + + + UPC12+5 (item-specific) on outer sleeve/back + AKA item/price; to be used only on products packaged in outer sleeves + + + + + UPC12 (price-point) on outer sleeve/back + AKA price/item; to be used only on products packaged in outer sleeves + + + + + UPC12+5 (price-point) on outer sleeve/back + AKA price/item; to be used only on products packaged in outer sleeves + + + + + + + Product form code + + + + + Undefined + + + + + + Audio + Audio recording - detail unspecified + + + + + Audio cassette + Audio cassette (analogue) + + + + + CD-Audio + Audio compact disk, in CD-Audio or SACD format + + + + + DAT + Digital audio tape cassette + + + + + Audio disk + Audio disk (excluding CD) + + + + + Audio tape + Audio tape (reel tape) + + + + + MiniDisc + Sony MiniDisc format + + + + + CD-Extra + Audio compact disk with part CD-ROM content + + + + + DVD Audio + + + + + + Downloadable audio file + Audio recording downloadable online + + + + + Other audio format + Other audio format not specified by AB to AJ + + + + + Book + Book - detail unspecified + + + + + Hardback + Hardback or cased book + + + + + Paperback + Paperback or softback book + + + + + Loose-leaf + Loose-leaf book + + + + + Spiral bound + Spiral, comb or coil bound book + + + + + Pamphlet + Pamphlet or brochure, stapled; German 'geheftet' + + + + + Leather / fine binding + + + + + + Board book + Child’s book with all pages printed on board + + + + + Rag book + Child’s book with all pages printed on textile + + + + + Bath book + Child’s book printed on waterproof material + + + + + Novelty book + Use for books whose novelty is expressed in the format itself, not for books in a conventional format which happen to have novelty content + + + + + Slide bound + Slide bound book + + + + + Big book + Extra-large format for teaching etc; this format and terminology may be specifically UK; required as a top-level differentiator + + + + + Part-work (fascículo) + A part-work issued with its own ISBN and intended to be collected and bound into a complete book + + + + + Leporello (folded) + A concertina-folded book, usually a picture 
book + + + + + Other book format + Other book format or binding not specified by BB to BO + + + + + Sheet map + Sheet map - detail unspecified + + + + + Sheet map, folded + + + + + + Sheet map, flat + + + + + + Sheet map, rolled + See Code List 80 for 'rolled in tube' + + + + + Globe + Globe or planisphere + + + + + Other cartographic + Other cartographic format not specified by CB to CE + + + + + Digital + Digital or multimedia (detail unspecified) + + + + + CD-ROM + + + + + + CD-I + CD interactive + + + + + DVD + Digital Versatile Disk: DEPRECATED - use VI for DVD video, AI for DVD audio, DI for DVD-ROM + + + + + Game cartridge + + + + + + Diskette + AKA 'floppy disk' + + + + + Electronic book text + Electronic book text in proprietary or open standard format + + + + + Online resource + An electronic database or other resource or service accessible through online networks + + + + + DVD-ROM + + + + + + Secure Digital (SD) Memory Card + + + + + + Compact Flash Memory Card + + + + + + Memory Stick Memory Card + + + + + + USB Flash Drive + + + + + + Other digital + Other digital or multimedia not specified by DB to DM + + + + + Film or transparency + Film or transparency – detail unspecified + + + + + Film + Continuous film or filmstrip: DEPRECATED - use FE or FF + + + + + Slides + Photographic transparencies mounted for projection + + + + + OHP transparencies + Transparencies for overhead projector + + + + + Filmstrip + + + + + + Film + Continuous movie film as opposed to filmstrip + + + + + Other film or transparency format + Other film or transparency format not specified by FB to FF + + + + + Microform + Microform – detail unspecified + + + + + Microfiche + + + + + + Microfilm + Roll microfilm + + + + + Other microform + Other microform not specified by MB or MC + + + + + Miscellaneous print + Miscellaneous printed material – detail unspecified + + + + + Address book + + + + + + Calendar + + + + + + Cards + Cards, flash cards (eg for teaching reading) + + + + + Copymasters + Copymasters, photocopiable sheets + + + + + Diary + + + + + + Frieze + + + + + + Kit + + + + + + Sheet music + + + + + + Postcard book or pack + + + + + + Poster + Poster for retail sale – see also XF + + + + + Record book + Record book (eg 'birthday book', 'baby book') + + + + + Wallet or folder + Wallet or folder (containing loose sheets etc): it is preferable to code the contents and treat 'wallet' as packaging (List 80), but if this is not possible the product as a whole may be coded as a 'wallet' + + + + + Pictures or photographs + + + + + + Wallchart + + + + + + Stickers + + + + + + Plate (lámina) + A book-sized (as opposed to poster-sized) sheet, usually in colour or high quality print + + + + + Other printed item + Other printed item not specified by PB to PQ + + + + + Video + Video – detail unspecified + + + + + Video, VHS, PAL + DEPRECATED - use new VJ + + + + + Video, VHS, NTSC + DEPRECATED - use new VJ + + + + + Video, Betamax, PAL + DEPRECATED - use new VK + + + + + Video, Betamax, NTSC + DEPRECATED - use new VK + + + + + Videodisk + eg Laserdisk + + + + + Video, VHS, SECAM + DEPRECATED - use new VJ + + + + + Video, Betamax, SECAM + DEPRECATED - use new VK + + + + + DVD video + DVD video: specify TV standard in List 78 + + + + + VHS video + VHS videotape: specify TV standard in List 78 + + + + + Betamax video + Betamax videotape: specify TV standard in List 78 + + + + + VCD + VideoCD + + + + + SVCD + Super VideoCD + + + + + Other video format + Other video format not specified by VB to VK + + + + + Mixed 
media product + A product consisting of two or more items in different media, eg book and CD-ROM, book and toy etc + + + + + Quantity pack + A product consisting of (a) a quantity of a single item, or (b) quantities of two or more separate items, packaged together for retail sale, eg a quantity pack of classroom texts, not to be confused with packs intended for trade distribution only – see XC, XE, XL + + + + + Trade-only material + Trade-only material (unspecified) + + + + + Dumpbin – empty + + + + + + Dumpbin – filled + Dumpbin with contents + + + + + Counterpack – empty + + + + + + Counterpack – filled + Counterpack with contents + + + + + Poster, promotional + Promotional poster for display, not for sale – see also PK + + + + + Shelf strip + + + + + + Window piece + Promotional piece for shop window display + + + + + Streamer + + + + + + Spinner + + + + + + Large book display + Large scale facsimile of book for promotional display + + + + + Shrink-wrapped pack + A quantity pack with its own product code, for trade supply only: the retail items it contains are intended for sale individually – see also WX + + + + + Other point of sale + Other point of sale material not specified by XB to XL + + + + + General merchandise + General merchandise – unspecified + + + + + Doll + + + + + + Soft toy + Soft or plush toy + + + + + Toy + + + + + + Game + Board game, or other game (except computer game: see DE) + + + + + T-shirt + + + + + + Other merchandize + Other merchandize not specified by ZB to ZF + + + + + + + Book form detail + + + + + A-format paperback + DEPRECATED + + + + + B-format paperback + ‘B’ format paperback: UK 198 x 129 mm - DEPRECATED + + + + + C-format paperback + ‘C’ format paperback: UK 216 x 135 mm - DEPRECATED + + + + + Paper over boards + DEPRECATED + + + + + Cloth + DEPRECATED + + + + + With dust jacket + DEPRECATED + + + + + Reinforced binding + DEPRECATED + + + + + + + Product classification type code + + + + + WCO Harmonized System + World Customs Organization Harmonized Commodity Coding & Description System + + + + + UNSPSC + UN Standard Product & Service Classification + + + + + HMC&E + UK Customs & Excise classifications, based on the Harmonized System + + + + + Warenverzeichnis für die Außenhandelsstatistik + German export trade classification, based on the Harmonised System + + + + + TARIC + EU TARIC codes, an extended version of the Harmonized System + + + + + + + Epublication type code + + + + + Epublication “content package” + An epublication viewed as a unique package of content which may be converted into any of a number of different types for delivery to the consumer. This code is used when an ONIX <Product> record describes the content package and lists within the record the different forms in which it is available. + + + + + HTML + An epublication delivered in a basic, unprotected, HTML format. Do NOT use for HTML-based formats which include DRM protection. + + + + + PDF + An epublication delivered in a basic, unprotected, PDF format. Do NOT use for PDF-based formats which include DRM protection. + + + + + PDF-Merchant + An epublication delivered in PDF format, capable of being read in the standard Acrobat Reader, and protected by PDF-Merchant DRM features. (This format is no longer supported for new applications.) 
+ + + + + Adobe Ebook Reader + An epublication delivered in an enhanced PDF format, using Adobe’s proprietary EBX DRM, capable of being read in the Adobe Ebook Reader software, on any platform which can support this software, which was formerly known as Glassbook. + + + + + Microsoft Reader Level 1/Level 3 + An epublication delivered in an unencrypted Microsoft .LIT format, capable of being read in the Microsoft Reader software at any level, on any platform which can support this software. (Level 3 differs from Level 1 only in that it embeds the name of the original purchaser.) + + + + + Microsoft Reader Level 5 + An epublication delivered in the Microsoft .LIT format, with full encryption, capable of being read in the Microsoft Reader software at Level 5, on any platform which can support this software. + + + + + NetLibrary + An epublication delivered in a proprietary HTML- or OEBF-based format, capable of being read only through subscription to the NetLibrary service. + + + + + MetaText + An epublication delivered in a proprietary format through a web browser, capable of being read only through subscription to the MetaText service (the educational division of NetLibrary) + + + + + MightyWords + An epublication delivered in a proprietary PDF-based format, capable of being read only through subscription to the MightyWords service. + + + + + Palm Reader + An epublication delivered in a proprietary HTML-based format, capable of being read in reading software which may be used on handheld devices using the Palm OS or Pocket PC/Windows CE operating systems. + + + + + Softbook + An epublication delivered in a proprietary format capable of being read in reading software which is specific to the Softbook hardware platform. Also capable of being read on the Softbook’s successor, the Gemstar REB 1200. + + + + + RocketBook + An epublication delivered in a proprietary .RB format, capable of being read in reading software which is specific to the RocketBook hardware platform. Also capable of being read on the RocketBook’s successor, the Gemstar REB 1100. + + + + + Gemstar REB 1100 + An epublication delivered in a proprietary .RB format, capable of being read in reading software which is specific to the Gemstar REB 1100 hardware platform. Also capable of being read on the RocketBook with some loss of functionality. + + + + + Gemstar REB 1200 + An epublication delivered in a proprietary format, capable of being read in reading software which is specific to the Gemstar REB 1200 hardware platform. Also capable of being read on the Softbook with some loss of functionality. + + + + + Franklin eBookman + An epublication delivered in Franklin’s proprietary HTML-based format, capable of being read in reading software which is specific to the Franklin eBookman platform. + + + + + Books24x7 + An epublication delivered in a proprietary XML-based format and available for online access only through subscription to the Books24x7 service. + + + + + DigitalOwl + An epublication available through DigitalOwl proprietary packaging, distribution and DRM software, delivered in a variety of formats across a range of platforms. + + + + + Handheldmed + An epublication delivered in a proprietary HTML-based format, capable of being read in Handheldmed reader software on Palm OS, Windows, and EPOC/Psion handheld devices, available only through the Handheldmed service. + + + + + WizeUp + An epublication delivered in a proprietary ???-based format and available for download only through the WizeUp service. 
+ + + + + TK3 + An epublication delivered in the proprietary TK3 format, capable of being read only in the TK3 reader software supplied by Night Kitchen Inc, on any platform which can support this software. + + + + + Litraweb + An epublication delivered in an encrypted .RTF format, capable of being read only in the Litraweb Visor software, and available only from Litraweb.com. + + + + + MobiPocket + An epublication delivered in a proprietary format, capable of being read in the MobiPocket software on PalmOS, WindowsCE /Pocket PC, Franklin eBookman, and EPOC32 handheld devices, available only through the MobiPocket service. + + + + + Open Ebook + An epublication delivered in the standard distribution format specified in the Open Ebook Publication Structure (OEBPS) format and capable of being read in any OEBPS-compliant reading system. + + + + + Town Compass DataViewer + An epublication delivered in a proprietary format, capable of being read in Town Compass DataViewer reader software on a Palm OS handheld device. + + + + + TXT + An epublication delivered in an openly available .TXT format, with ASCII or UTF-8 encoding, as used for example in Project Gutenberg + + + + + ExeBook + An epublication delivered as a self-executing file including its own reader software, and created with proprietary ExeBook Self-Publisher software + + + + + Sony BBeB + An epublication delivered in a proprietary format, capable of being read on a Sony Reader handheld device + + + + + + + Epublication format code + + + + + HTML + + + + + + PDF + + + + + + Microsoft Reader + ‘.LIT’ file format used by Microsoft Reader software + + + + + RocketBook + + + + + + Rich text format (RTF) + + + + + + Open Ebook Publication Structure (OEBPS) format standard + + + + + + XML + + + + + + SGML + + + + + + EXE + ‘.EXE’ file format used when an epublication is delivered as a self-executing package of software and content. + + + + + ASCII + ‘.TXT’ file format + + + + + MobiPocket format + Proprietary file format used for the MobiPocket reader software + + + + + + + Trade category code + + + + + UK open market edition + An edition from a UK publisher sold only in territories where exclusive rights are not held. Rights details should be carried in PR.21 as usual. + + + + + Airport edition + In UK, an edition intended primarily for airside sales in UK airports, though it may be available for sale in other territories where exclusive rights are not held. Details should be carried in PR.21 as usual. + + + + + Sonderausgabe + In Germany, a special printing sold at a lower price than the regular hardback + + + + + Pocket paperback + In countries where recognised as a distinct trade category, eg France 'livre de poche', Germany 'Taschenbuch', Italy 'tascabile', Spain 'libro de bolsillo + + + + + International edition (US) + Edition produced solely for sale in designated export markets + + + + + Library audio edition + Audio product sold in special durable packaging and with a replacement guarantee for the contained cassettes or CDs for a specified shelf-life + + + + + US open market edition + An edition from a US publisher sold only in territories where exclusive rights are not held. Rights details should be carried in PR.21 as usual. 
+ + + + + Livre scolaire, déclaré par l'éditeur + In France, a category of book that has a particular legal status, claimed by the publisher + + + + + Livre scolaire (non spécifié) + In France, a category of book that has a particular legal status, designated independently of the publisher + + + + + + + Series identifier type code + + + + + Proprietary + For example, publisher’s own series ID + + + + + ISSN + + + + + + German National Bibliography series ID + Maintained by the Deutsche Bibliothek + + + + + German Books in Print series ID + Maintained by VLB + + + + + Electre series ID + Maintained by Electre Information, France + + + + + DOI + + + + + + + + Text case flag + + + + + Undefined + Default + + + + + Sentence case + Initial capitals on first word and subsequently on proper names only, eg The conquest of Mexico + + + + + Title case + Initial capitals on first word and on all significant words thereafter, eg The Conquest of Mexico + + + + + All capitals + For example, THE CONQUEST OF MEXICO + + + + + + + Title type code + + + + + Undefined + + + + + + Distinctive title(book); cover title (serial) + The full text of the distinctive title of the item, without abbreviation or abridgement. For books, where the title alone is not distinctive, elements may be taken from a set or series title and part number etc to create a distinctive title. Where the item is an omnibus edition containing two or more works by the same author, and there is no separate combined title, a distinctive title may be constructed by concatenating the individual titles, with suitable punctuation, as in Pride and prejudice / Sense and sensibility / Northanger Abbey. + + + + + ISSN key title of serial + Serials only + + + + + Title in original language + Where the subject of the ONIX record is a translated item + + + + + Title acronym + For serials: JACM = Journal of the Association for Computing Machinery + + + + + Abbreviated title + An abbreviated form of Title Type 01 + + + + + Title in other language + A translation of Title Type 01 into another language + + + + + Thematic title of journal issue + Serials only: when a journal issue is explicitly devoted to a specified topic + + + + + Former title + Books or serials: when an item was previously published under another title + + + + + Distributor's title + For books: the title carried in a book distributor's title file: frequently incomplete, and may include elements not properly part of the title + + + + + + + Work identifier type code + + + + + Proprietary + + + + + + ISBN + ISBN of manifestation of work, when this is the only identifier available + + + + + DOI + + + + + + ISTC + + + + + + + + Contributor role code + + + + + By (author) + Author of a textual work + + + + + With + With or as told to: 'ghost' author of a literary work + + + + + Screenplay by + Writer of screenplay or script (film or video) + + + + + Libretto by + Writer of libretto (opera): see also A31 + + + + + Lyrics by + Author of lyrics (song): see also A31 + + + + + By (composer) + Composer of music + + + + + By (artist) + Visual artist when named as the primary creator of, eg, a book of reproductions of artworks + + + + + By (photographer) + Photographer when named as the primary creator of, eg, a book of photographs) + + + + + Created by + + + + + + From an idea by + + + + + + Designed by + + + + + + Illustrated by + Artist when named as the creator of artwork which illustrates a text, or of the artwork of a graphic novel or comic book + + + + + Photographs by + Photographer when named 
as the creator of photographs which illustrate a text + + + + + Text by + Author of text which accompanies art reproductions or photographs, or which is part of a graphic novel or comic book + + + + + Preface by + Author of preface + + + + + Prologue by + Author of prologue + + + + + Summary by + Author of summary + + + + + Supplement by + Author of supplement + + + + + Afterword by + Author of afterword + + + + + Notes by + Author of notes or annotations: see also A29 + + + + + Commentaries by + Author of commentaries on the main text + + + + + Epilogue by + Author of epilogue + + + + + Foreword by + Author of foreword + + + + + Introduction by + Author of introduction: see also A29 + + + + + Footnotes by + Author/compiler of footnotes + + + + + Memoir by + Author of memoir accompanying main text + + + + + Experiments by + Person who carried out experiments reported in the text + + + + + Introduction and notes by + Author of introduction and notes: see also A20 and A24 + + + + + Software written by + Writer of computer programs ancillary to the text + + + + + Book and lyrics by + Author of the textual content of a musical drama: see also A04 and A05 + + + + + Contributions by + Author of additional contributions to the text + + + + + Appendix by + Author of appendix + + + + + Index by + Compiler of index + + + + + Drawings by + + + + + + Cover design or artwork by + Use also for the cover artist of a graphic novel or comic book if named separately + + + + + Preliminary work by + Responsible for preliminary work on which the work is based + + + + + Original author + Author of the first edition (usually of a standard work) who is not an author of the current edition + + + + + Maps by + Maps drawn or otherwise contributed by + + + + + Inked or colored by + When separate persons are named as having respectively drawn and colored artwork, eg for a graphic novel or comic book, use A12 for 'drawn by' and A40 for 'colored by' + + + + + Other primary creator + Other type of primary creator not specified above + + + + + Edited by + + + + + + Revised by + + + + + + Retold by + + + + + + Abridged by + + + + + + Adapted by + + + + + + Translated by + + + + + + As told by + + + + + + Translated with commentary by + This code applies where a translator has provided a commentary on issues relating to the translation. If the translator has also provided a commentary on the work itself, the name should be entered twice using codes B06 and A21. 
+ + + + + Series edited by + Name of a series editor when the product belongs to a series + + + + + Edited and translated by + + + + + + Editor-in-chief + + + + + + Guest editor + + + + + + Volume editor + + + + + + Editorial board member + + + + + + Editorial coordination by + + + + + + Managing editor + + + + + + Founded by + Usually the founder editor of a serial publication: Begruendet von + + + + + Prepared for publication by + + + + + + Associate editor + + + + + + Consultant editor + Use also for 'advisory editor' + + + + + General editor + + + + + + Dramatized by + + + + + + General rapporteur + In Europe, an expert editor who takes responsibility for the legal content of a collaborative law volume + + + + + Literary editor + An editor who is responsible for establishing the text used in an edition of a literary work, where this is recognised as a distinctive role (in Spain, 'editor literario') + + + + + Other adaptation by + Other type of adaptation or editing not specified above + + + + + Compiled by + + + + + + Selected by + + + + + + Other compilation by + Other type of compilation not specified above + + + + + Producer + + + + + + Director + + + + + + Conductor + Conductor of a musical performance + + + + + Other direction by + Other type of direction not specified above + + + + + Actor + + + + + + Dancer + + + + + + Narrator + + + + + + Commentator + + + + + + Vocal soloist + Singer etc + + + + + Instrumental soloist + + + + + + Read by + Reader of recorded text, as in an audiobook + + + + + Performed by (orchestra, band, ensemble) + Name of a musical group in a performing role + + + + + Performed by + Other type of performer not specified above: use for a recorded performance which does not fit a category above, eg a performance by a stand-up comedian. + + + + + Filmed/photographed by + + + + + + Other recording by + Other type of recording not specified above + + + + + Assisted by + May be associated with any contributor role, and placement should therefore be controlled by contributor sequence numbering + + + + + Other + Other creative responsibility not falling within A to F above + + + + + + + Person name type + + + + + Unspecified + + + + + + Pseudonym + + + + + + Authority-controlled name + + + + + + + + Unnamed person(s) + + + + + Unknown + + + + + + Anonymous + + + + + + et al + And others: additional contributors not listed + + + + + Various authors + When the product is a pack of books by different authors + + + + + + + Conference role + + + + + + Edition type code + + + + + Abridged + Content has been shortened: use for abridged, shortened, concise, condensed. + + + + + Adapted + Content has been adapted to serve a different purpose or audience, or from one medium to another: use for dramatization, novelization etc. Use <EditionStatement> to describe the exact nature of the adaptation. + + + + + Alternate + Do not use. This code is now deprecated, but is retained in the list for reasons of upwards compatibility. + + + + + Annotated + Content is augmented by the addition of notes + + + + + Bilingual edition + Both languages should be specified in the 'Language' group. Use MLL for an edition in more than two languages. + + + + + Braille + Braille edition + + + + + Critical + Content includes critical commentary on the text + + + + + Coursepack + Content was compiled for a specified educational course. + + + + + Enlarged + Content has been enlarged or expanded from that of a previous edition. 
+   Expurgated – 'Offensive' content has been removed
+   Facsimile – Exact reproduction of the content and format of a previous edition
+   Illustrated – Content includes extensive illustrations which are not part of other editions
+   Large type / large print – Large print edition, print sizes 14 to 19 pt - see also ULP
+   Microprint – A printed edition in a type size too small to be read without a magnifying glass
+   Media tie-in – An edition published to coincide with the release of a film, TV program, or electronic game based on the same work. Use <EditionStatement> to describe the exact nature of the tie-in.
+   Multilingual edition – All languages should be specified in the 'Language' group. Use BLL for a bilingual edition.
+   New edition – Where no other information is given, or no other coded type is applicable
+   Revised – Content has been revised from that of a previous edition
+   School edition – An edition intended specifically for use in schools
+   Special edition – Use for anniversary, collectors', de luxe, gift, limited, numbered, autographed edition. Use <EditionStatement> to describe the exact nature of the special edition.
+   Student edition – Where a text is available in both student and teacher's editions
+   Teacher's edition – Where a text is available in both student and teacher's editions; use also for instructor's or leader's editions
+   Unabridged – Where a title has also been published in an abridged edition; also for audiobooks, regardless of whether an abridged audio version also exists
+   Ultra large print – For print sizes 20pt and above, and with typefaces designed for the visually impaired - see also LTE
+   Unexpurgated – Content previously considered 'offensive' has been restored
+   Variorum – Content includes notes by various commentators, and/or includes and compares several variant texts of the same work
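
The edition-type headings above carry no machine-readable structure of their own, so an importer has to decide which of its own edition fields each heading maps onto. A minimal sketch, assuming hypothetical Open Library-style field names (edition_name, physical_format) that are not part of this code list:

    # Illustrative mapping from a few edition-type headings in the list
    # above to fields a book importer might set; headings not listed are
    # simply ignored. Field names here are assumptions, not ONIX terms.
    EDITION_TYPE_FIELDS = {
        'Revised': {'edition_name': 'Revised edition'},
        'Unabridged': {'edition_name': 'Unabridged edition'},
        'Facsimile': {'edition_name': 'Facsimile edition'},
        'Large type / large print': {'physical_format': 'Large print'},
    }

    def apply_edition_type(record, heading):
        """Merge any fields implied by an ONIX edition-type heading into a record dict."""
        record.update(EDITION_TYPE_FIELDS.get(heading, {}))
        return record
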
+ + + + + + + Language role code + + + + + Language of text + + + + + + Original language of a translated text + Where the text in the original language is NOT part of the current product + + + + + Language of abstracts + Where different from language of text: used mainly for serials + + + + + Rights language + Language to which specified rights apply + + + + + Rights-excluded language + Language to which specified rights do not apply + + + + + Original language in a multilingual edition + Where the text in the original language is part of a bilingual or multilingual edition + + + + + Translated language in a multilingual edition + Where the text in a translated language is part of a bilingual or multilingual edition + + + + + + + Extent type code + + + + + Number of words + Number of words of natural language text + + + + + Duration: use for running time + + + + + + Filesize + + + + + + + + Extent unit code + + + + + Words + Words of natural language text + + + + + Hours (integer and decimals) + + + + + + Minutes (integer and decimals) + + + + + + Seconds (integer only) + + + + + + Hours HHH + + + + + + Hours and minutes HHHMM + + + + + + Hours minutes seconds HHHMMSS + + + + + + Kbytes + + + + + + Mbytes + + + + + + + + Illustration and other content type code + + + + + Illustrations, black & white + + + + + + Illustrations, color + + + + + + Halftones, black & white + Including black & white photographs + + + + + Halftones, color + Including color photographs + + + + + Line drawings, black & white + + + + + + Line drawings, color + + + + + + Tables, black & white + + + + + + Tables, color + + + + + + Illustrations, unspecified + + + + + + Halftones, unspecified + Including photographs + + + + + Tables, unspecified + + + + + + Line drawings, unspecified + + + + + + Halftones, duotone + + + + + + Maps + + + + + + Frontispiece + + + + + + Diagrams + + + + + + Figures + + + + + + Charts + + + + + + Recorded music items + Recorded music extracts or examples, or complete recorded work(s), accompanying textual or other content + + + + + Printed music items + Printed music extracts or examples, or complete music score(s), accompanying textual or other content + + + + + Graphs + To be used in the mathematical sense of a diagram that represents numerical values plotted against an origin and axes, cf codes 16 and 18 + + + + + Plates, unspecified + ‘Plates’ means illustrations that are on separate pages bound into the body of a book + + + + + Plates, black & white + ‘Plates’ means illustrations that are on separate pages bound into the body of a book + + + + + Plates, color + ‘Plates’ means illustrations that are on separate pages bound into the body of a book + + + + + Index + + + + + + Bibliography + + + + + + + + Main subject scheme identifier code + + + + + UDC + Universal Decimal Classification. Code + + + + + BISAC category code + For information on BISAC subject categories, see http://www.bisg.org. Code + + + + + BIC subject category + For all BIC subject codes and qualifiers, see http://www.bic.org.uk/subcats.html. Code + + + + + Tabla de materias ISBN + Latin America. Code + + + + + Warengruppen-Systematik des deutschen Buchhandels + Code + + + + + Thèmes Electre + Subject classification used by Electre (France). Code + + + + + CLIL (France) + Code + + + + + DNB-Sachgruppen + Deutsche Bibliothek subject groups. Code + + + + + NUR + Nederlandstalige Uniforme Rubrieksindeling (Dutch book trade classification). 
Code + + + + + ECPA Christian Book Category + ECPA Christian Product Category Book Codes, consisting of up to three 3-letter blocks, for Super Category, Primary Category and Sub-Category. See http://www.ecpa.org/ECPA/cbacategories.xls. Code + + + + + Korean Decimal Classification (KDC) + A modified Dewey Decimal Classification used in the Republic of Korea. Code + + + + + DDC Deutsch + Code + + + + + Nippon Decimal Classification + Japanese subject classification scheme. Code + + + + + ANELE Materias + Spain: subject coding scheme of the Asociación Nacional de Editores de Libros y Material de Enseñanza. Code + + + + + + + Subject scheme identifier code + + + + + Dewey + Code + + + + + Abridged Dewey + Code + + + + + LC class number + Code + + + + + LC subject heading + Text + + + + + UDC + Universal Decimal Classification. Code + + + + + BISAC category code + For information on BISAC subject categories, see http://www.bisg.org. Code + + + + + BISAC region code + A geographical qualifier used with a BISAC subject category. Code + + + + + BIC subject category + For all BIC subject codes and qualifiers, see http://www.bic.org.uk/subcats.html. Code + + + + + BIC geographical qualifier + Code + + + + + BIC language qualifier (language as subject) + Code + + + + + BIC time period qualifier + Code + + + + + BIC educational purpose qualifier + Code + + + + + BIC reading level & special interest qualifier + Code + + + + + LC fiction genre heading + Text + + + + + Keywords + Text + + + + + BIC children’s book marketing category + See http://www.bic.org.uk/cbmc.html. Code + + + + + BISAC book merchandising code + For information on BISAC subject categories, see http://www.bisg.org. Code + + + + + Publisher’s own category code + Code + + + + + Proprietary subject scheme + Code + + + + + Tabla de materias ISBN + Latin America. Code + + + + + Warengruppen-Systematik des deutschen Buchhandels + Code + + + + + Schlagwort-Normdatei der Deutschen Bibliothek + Text + + + + + Thèmes Electre + Subject classification used by Electre (France). Code + + + + + CLIL + France. Code + + + + + DNB-Sachgruppen + Deutsche Bibliothek subject groups. Code + + + + + NUGI + Nederlandse Uniforme Genre-Indeling (former Dutch book trade classification). Code + + + + + NUR + Nederlandstalige Uniforme Rubrieksindeling (Dutch book trade classification, from 2002). Code + + + + + ECPA Christian Book Category + ECPA Christian Product Category Book Codes, consisting of up to three x 3-letter blocks, for Super Category, Primary Category and Sub-Category. See http://www.ecpa.org/ECPA/cbacategories.xls. Code + + + + + SISO + Schema Indeling Systematische Catalogus Openbare Bibliotheken (Dutch library classification). Code + + + + + Korean Decimal Classification (KDC) + A modified Dewey Decimal Classification used in the Republic of Korea. Code + + + + + DDC Deutsch + Code + + + + + Bokgrupper + Norwegian book trade product categories (4701) + + + + + Varegrupper + Norwegian bookselling subject categories (4702) + + + + + Læreplaner + Norwegian school curriculum version (4703) + + + + + Nippon Decimal Classification + Japanese subject classification scheme. Code + + + + + BSQ + BookSelling Qualifier: Russian book trade classification. Code + + + + + ANELE Materias + Spain: subject coding scheme of the Asociación Nacional de Editores de Libros y Material de Enseñanza. 
Code + + + + + Skolefag + Norwegian primary and secondary school subject categories (4705) + + + + + Videregående + Norwegian list of categories used in higher secondary education and vocational training (4706) + + + + + Undervisningsmateriell + Norwegian list of categories for books and other material used in education (4707) + + + + + Norsk DDK + Norwegian version of Dewey Decimal Classification + + + + + + + Audience code + + + + + General/trade + For a non-specialist adult audience + + + + + Children/juvenile + For a juvenile audience, not specifically for any educational purpose + + + + + Young adult + For a teenage audience, not specifically for any educational purpose + + + + + Primary & secondary/elementary & high school + Kindergarten, pre-school, primary/elementary or secondary/high school education + + + + + College/higher education + For universities and colleges of further and higher education + + + + + Professional and scholarly + For an expert adult audience, including academic research + + + + + ELT/ESL + Intended for use in teaching English as a second language + + + + + Adult education + For centres providing academic, vocational or recreational courses for adults + + + + + + + Audience code type + + + + + ONIX audience codes + Using List 28 + + + + + Proprietary + + + + + + MPAA rating + Motion Picture Association of America rating applied to movies + + + + + BBFC rating + British Board of Film Classification rating applied to movies + + + + + FSK rating + German FSK (Freiwillige Selbstkontrolle der Filmwirtschaft) rating applied to movies + + + + + BTLF audience code + French Canadian audience code list, used by BTLF for Memento + + + + + Electre audience code + Audience code used by Electre (France) + + + + + ANELE Tipo + Spain: educational audience and material type code of the Asociación Nacional de Editores de Libros y Material de Enseñanza + + + + + + + Audience range qualifier + + + + + US school grade range + Values for <AudienceRangeValue> are specified in List 77 + + + + + UK school grade + Values are defined by BIC for England & Wales, Scotland and N Ireland + + + + + Interest age, months + For use up to 30 months only: values in <AudienceRangeValue> must be integers + + + + + Interest age, years + Values in <AudienceRangeValue> must be integers + + + + + Reading age, years + Values in <AudienceRangeValue> must be integers + + + + + Spanish school grade + Spain: combined grade and region code, maintained by the Ministerio de Educación + + + + + Skoletrinn + Norwegian educational grades (4704) + + + + + + + Audience range precision + + + + + Exact + + + + + + From + + + + + + To + + + + + + + + Complexity scheme identifier + + + + + Lexile code + + + + + + Lexile number + + + + + + + + Other text type code + + + + + Main description + + + + + + Short description/annotation + Limited to a maximum of 350 characters + + + + + Long description + + + + + + Table of contents + Used for a table of contents sent as a single text field, which may or may not carry structure expressed through HTML etc. Alternatively, a fully structured table of contents may be sent by using the <ContentItem> composite. 
+ + + + + Review quote, restricted length + A review quote that is restricted to a maximum length agreed between the sender and receiver of an ONIX file + + + + + Quote from review of previous edition + A review quote taken from a review of a previous edition of the work + + + + + Review text + Full text of a review of the product + + + + + Review quote + A quote from a review of the product + + + + + Promotional “headline” + A promotional phrase which is intended to headline a description of the product + + + + + Previous review quote + A quote from a review of a previous work by the same author(s) or in the same series + + + + + Author comments + May be part of Reading Group Guide material + + + + + Description for reader + + + + + + Biographical note + A note referring to all contributors to a product – NOT linked to a single contributor + + + + + Description for Reading Group Guide + + + + + + Discussion question for Reading Group Guide + Each instance must carry a single question + + + + + Competing titles + Free text listing of other titles with which the product is in competition: although this text might not appear in “public” ONIX records, it could be required where ONIX Is used as a communication format within a group of publishing and distribution companies + + + + + Flap copy + + + + + + Back cover copy + + + + + + Feature + Text describing a feature of a product to which the publisher wishes to draw attention for promotional purposes. Each separate feature should be described by a separate repeat, so that formatting can be applied at the discretion of the receiver of the ONIX record. + + + + + New feature + As code 19, but used for a feature which is new in a new edition of the product. + + + + + Excerpt from book + + + + + + First chapter + + + + + + Description for sales people + + + + + + Description for press or other media + + + + + + Description for subsidiary rights department + + + + + + Description for teachers/educators + + + + + + Unpublished endorsement + A quote usually provided by a celebrity to promote a new book, not from a review + + + + + Description for bookstore + + + + + + Description for library + + + + + + Introduction or preface + + + + + + Full text + + + + + + + + Text format code + + + + + ASCII text + DEPRECATED: use code 06 or 07 as appropriate + + + + + SGML + + + + + + HTML + Other than XHTML + + + + + XML + Other than XHTML + + + + + PDF + DEPRECATED: was formerly assigned both to PDF and to XHTML + + + + + XHTML + + + + + + Default text format + Default: text in the encoding declared at the head of the message or in the XML default (UTF-8 or UTF-16) if there is no explicit declaration + + + + + Basic ASCII text + Plain text containing no tags of any kind, except for the tags &amp; and &lt; that XML insists must be used to represent ampersand and less-than characters in text; and with the character set limited to the ASCII range, i.e. 
valid UTF-8 characters whose character number lies between 32 (space) and 126 (tilde) + + + + + PDF + Replaces 04 for the <TextFormat> element, but cannot of course be used as a textformat attribute + + + + + + + Text link type code + + + + + URL + + + + + + DOI + + + + + + PURL + + + + + + URN + + + + + + FTP address + + + + + + filename + + + + + + + + Front cover image file format code + + + + + GIF + + + + + + JPEG + + + + + + TIF + + + + + + + + Front cover image file link type code + + + + + URL + + + + + + DOI + + + + + + PURL + + + + + + URN + + + + + + FTP address + + + + + + filename + + + + + + + + Image/audio/video file type code + + + + + Whole product + Link to a location where the whole product may be found – used for epublications + + + + + Software demo + + + + + + Front cover image + Quality unspecified: if sending both a standard quality and a high quality image, use 04 for standard quality and 06 for high quality + + + + + Front cover high quality image + + + + + + Front cover thumbnail + + + + + + Contributor image + + + + + + Series image + + + + + + Series logo + + + + + + Product logo + Use only for a logo which is specific to an individual product + + + + + Publisher logo + + + + + + Imprint logo + + + + + + Inside page image + + + + + + Video segment + + + + + + Audio segment + + + + + + + + Image/audio/video file format code + + + + + GIF + + + + + + JPEG + + + + + + PDF + + + + + + TIF + + + + + + RealAudio 28.8 + + + + + + MP3 + + + + + + MPEG-4 + MPEG-4 video file + + + + + + + Image/audio/video file link type + + + + + URL + + + + + + DOI + + + + + + PURL + + + + + + URN + + + + + + FTP address + + + + + + filename + + + + + + + + Prize or award achievement code + + + + + Winner + + + + + + Runner-up + Named as being in second place + + + + + Commended + + + + + + Short-listed + Nominated by the judging process to be one of the final 'short-list' from which the winner is selected + + + + + Long-listed + Nominated by the judging process to be one of the preliminary 'long-list' from which first a short-list and then the winner is selected + + + + + Joint winner + Or co-winner + + + + + + + Text item type code + + + + + Textual work + A complete work which is published as a content item in a product which carries two or more such works, eg when two or three novels are published in a single omnibus volume + + + + + Front matter + Text components such as Preface, Introduction etc which appear as preliminaries to the main body of text content in a product + + + + + Body matter + Text components such as Part, Chapter, Section etc which appear as part of the main body of text content in a product + + + + + Back matter + Text components such as Index which appear after the main body of text in a product + + + + + Serial item, miscellaneous or unspecified + For journals + + + + + Research article + For journals + + + + + Review article + For journals + + + + + Letter + For journals + + + + + Short communication + For journals + + + + + Erratum + For journals + + + + + Abstract + For journals + + + + + Book review (or review of other publication) + For journals + + + + + Editorial + For journals + + + + + Product review + For journals + + + + + Index + + + + + + Obituary + For journals + + + + + + + Text item identifier type code + + + + + Proprietary + For example, a publisher’s own identifier + + + + + DOI + + + + + + PII + + + + + + SICI + For serial items only + + + + + + + Name code type + + + + + Proprietary + + + + + + Deutsche Bibliothek publisher identifier + + 
+ + + + Börsenverein Verkehrsnummer + + + + + + German ISBN Agency publisher identifier + + + + + + EAN-UCC GLN + Global location number (formerly EAN location number) + + + + + SAN + Book trade Standard Address Number - US, UK etc + + + + + Centraal Boekhuis Relatie ID + Trading party identifier used in the Netherlands + + + + + + + Publishing role code + + + + + Publisher + + + + + + Co-publisher + + + + + + Sponsor + + + + + + Publisher of original-language version + Of a translated work + + + + + Host/distributor of electronic content + + + + + + Published for/on behalf of + + + + + + Published in association with + Use also for “Published in cooperation with” + + + + + Published on behalf of + DEPRECATED: use code 06 + + + + + New or acquiring publisher + When ownership of a product or title is transferred from one publisher to another + + + + + + + Sales rights type code + + + + + For sale with exclusive rights in the specified country/ies + + + + + + For sale with non-exclusive rights in the specified country/ies + + + + + + Not for sale in the specified country/ies + + + + + + + + Rights region + + + + + World + + + + + + World except territories specified elsewhere in rights statements + + + + + + UK airports + + + + + + UK 'open market' + Use when an open market edition is published under its own ISBN + + + + + + + Measure type code + + + + + Height + For a book, the spine height when standing on a shelf + + + + + Width + For a book, the horizontal dimension of the cover when standing upright + + + + + Thickness + For a book, the thickness of the spine + + + + + Page trim height + Not recommended for general use + + + + + Page trim width + Not recommended for general use + + + + + Unit weight + + + + + + Diameter + Of a globe, for example + + + + + + + Rights territory code + + + + + Australian Capital Territory + + + + + + New South Wales + + + + + + Northern Territory + + + + + + Queensland + + + + + + South Australia + + + + + + Tasmania + + + + + + Victoria + + + + + + Western Australia + + + + + + Alberta + + + + + + British Columbia + + + + + + Manitoba + + + + + + New Brunswick + + + + + + Newfoundland and Labrador + + + + + + Nova Scotia + + + + + + Northwest Territories + + + + + + Nunavut + + + + + + Ontario + + + + + + Prince Edward Island + + + + + + Quebec + + + + + + Saskatchewan + + + + + + Yukon Territory + + + + + + Canary Islands + + + + + + UK airside + Airside outlets at UK international airports only + + + + + UK airports + All UK airports, including both airside and other outlets + + + + + Channel Islands + + + + + + England + + + + + + England, Wales, Scotland + UK excluding Northern Ireland + + + + + Isle of Man + + + + + + Northern Ireland + + + + + + Scotland + + + + + + Wales + + + + + + Rest of world + World except as otherwise specified + + + + + World + + + + + + + + Measure unit code + + + + + Centimeters + + + + + + Grams + + + + + + Inches (US) + + + + + + Pounds (US) + + + + + + Millimeters + + + + + + Ounces (US) + + + + + + + + Relation code + + + + + Includes + X includes Y (where the product described in the ONIX record is X and the related product is Y) + + + + + Is part of + X is part of Y – use for 'also available as part of' + + + + + Replaces + X replaces Y + + + + + Replaced by + X is replaced by Y  + + + + + Alternative format + X is available in an alternative format as Y – indicates an alternative format of the same content which is or may be available. 
+   Has ancillary product – X has an ancillary or supplementary product Y
+   Is ancillary to – X is ancillary or supplementary to Y
+   Is remaindered as – X is remaindered as Y, when a remainder merchant assigns its own identifier to the product
+   Is remainder of – X was originally sold as Y, indicating the publisher's original identifier for a title which is offered as a remainder under a different identifier
+   Is other-language version of – X is an other-language version of Y
+   Publisher's suggested alternative – X has a publisher's suggested alternative Y, which does not, however, carry the same content (cf 05 and 06)
+   Epublication based on (print product) – X is an epublication based on printed product Y
+   Epublication is distributed as – X is an epublication 'rendered' as Y: use when the ONIX record describes a package of electronic content which is available in multiple 'renderings'
+   Epublication is a rendering of – X is a 'rendering' of an epublication Y: use when the ONIX record describes a specific rendering of an epublication content package, to identify the package
+   POD replacement for – X is a POD replacement for Y; Y is an out-of-print product replaced by a print-on-demand version under a new ISBN
+   Replaced by POD – X is replaced by POD Y; Y is a print-on-demand replacement, under a new ISBN, for an out-of-print product X
+
+ Supply-to region code
+   UK 'open market' – When the same ISBN is used for open market and UK editions
+
+ Returns conditions code type
+   French book trade returns conditions code – Maintained by CLIL (Commission Interprofessionnel du Livre)
+   BISAC Returnable Indicator code – Maintained by BISAC: see List 66
+   UK book trade returns conditions code – NOT CURRENTLY USED - BIC has decided that it will not maintain a code list for this purpose, since returns conditions are usually at least partly based on the trading relationship
+
+ Availability status code
+   Cancelled – Publication abandoned after having been announced
+   Available direct from publisher only – Apply direct to publisher, item not available to trade
+   Availability uncertain – Check with customer service
+   No longer stocked by us – Wholesaler or vendor only
+   Available – In-print and in stock
+   Manufactured on demand – May be accompanied by an estimated average time to supply
+   Not yet published – MUST be accompanied by an expected availability date
+   Newly catalogued, not yet in stock – Wholesaler or vendor only: MUST be accompanied by expected availability date
+   Other format available – This format is out of print, but another format is available: should be accompanied by an identifier for the alternative product
+   Out of stock indefinitely – No current plan to reprint
+   Out of print – Discontinued, deleted from catalogue
+   Replaced by new edition – This edition is out of print, but a new edition has been or will soon be published: should be accompanied by an identifier for the new edition
+   Publication postponed indefinitely – Publication has been announced, and subsequently postponed with no new date
+   Refer to another supplier – Supply of this item has been transferred to another publisher or distributor: should be accompanied by an identifier for the new supplier
+   Remaindered
+   Reprinting – MUST be accompanied by an expected availability date
+   Reprinting, undated – Use instead of RP as a last resort, only if it is really impossible to give an expected availability date
+   Special order – This item is not stocked but has to be specially ordered from a supplier (eg import item not stocked locally): may be accompanied by an estimated average time to supply
+   Temporarily out of stock because publisher cannot supply – Wholesaler or vendor only
+   Temporarily unavailable – MUST be accompanied by an expected availability date
+   Unavailable, awaiting reissue – The item is out of stock but will be reissued under the same ISBN: MUST be accompanied by an expected availability date and by the reissue date in the <Reissue> composite. See notes on the <Reissue> composite for details on treatment of availability status during reissue.
+   Will be remaindered as of (date) – MUST be accompanied by the remainder date
+   Withdrawn from sale – Typically, withdrawn indefinitely for legal reasons
+
+ Date format
+   YYYYMMDD – Year month day (default)
+   YYYYMM – Year and month
+   YYYYWW – Year and week number
+   YYYYQ – Year and quarter (Q = 1, 2, 3, 4)
+   YYYYS – Year and season (S = 1, 2, 3, 4, with 1 = "Spring")
+   YYYY – Year
+   YYYYMMDDYYYYMMDD – Spread of exact dates
+   YYYYMMYYYYMM – Spread of months
+   YYYYWWYYYYWW – Spread of week numbers
+   YYYYQYYYYQ – Spread of quarters
+   YYYYSYYYYS – Spread of seasons
+   YYYYYYYY – Spread of years
+   Text string – For complex, approximate or uncertain dates
+
+ Audience restriction flag
+   Restrictions apply, see note
+   Indiziert – Indexed for the German market (in Deutschland indiziert)
+
+ Unpriced item type code
+   Free of charge
+   Price to be announced
+   Not sold separately
+   Contact publisher or supplier – May be used for books that do not carry a recommended retail price, when an ONIX file is "broadcast" rather than sent one-to-one to a single trading partner
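
The Date format list above gives the patterns used to interpret ONIX date fields. A minimal, illustrative sketch of reducing a single-value date to a year or ISO-style string (spreads and free-text dates are passed through unchanged; the function name is an assumption, not part of ONIX):

    def normalize_onix_date(value, pattern):
        # Single-value patterns from the list above; anything else
        # (spreads, 'Text string' dates) is returned untouched.
        if pattern == 'YYYYMMDD' and len(value) == 8:
            return '%s-%s-%s' % (value[0:4], value[4:6], value[6:8])
        if pattern == 'YYYYMM' and len(value) == 6:
            return '%s-%s' % (value[0:4], value[4:6])
        if pattern in ('YYYYWW', 'YYYYQ', 'YYYYS', 'YYYY'):
            return value[0:4]   # keep just the year
        return value

    normalize_onix_date('20031122', 'YYYYMMDD')   # -> '2003-11-22'
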
+ Price type code
+   RRP excluding any sales tax or value-added tax
+   RRP including sales or value-added tax if applicable
+   Fixed retail price excluding tax – In countries where retail price maintenance applies by law to certain products: not used in USA
+   Fixed retail price including tax – In countries where retail price maintenance applies by law to certain products: not used in USA
+   Supplier's unit cost price excluding any sales tax or value-added tax: goods for retail sale – In North America, this may be referred to as 'net price'
+   Supplier's unit cost price excluding any sales tax or value-added tax: rental goods – Used for video and DVD
+   Special sale RRP excluding any sales tax or value-added tax
+   Special sale RRP including sales or value-added tax if applicable
+   Special sale fixed retail price excluding tax – In countries where retail price maintenance applies by law to certain products: not used in USA
+   Special sale fixed retail price including tax – In countries where retail price maintenance applies by law to certain products: not used in USA
+   Supplier's unit cost price for special sale excluding any sales tax or value-added tax
+   Pre-publication RRP excluding any sales tax or value-added tax
+   Pre-publication RRP including sales or value-added tax if applicable
+   Pre-publication fixed retail price excluding tax – In countries where retail price maintenance applies by law to certain products: not used in USA
+   Pre-publication fixed retail price including tax – In countries where retail price maintenance applies by law to certain products: not used in USA
+   Supplier's pre-publication unit cost price excluding tax
+   Freight-pass-through RRP excluding tax – In the US, books are sometimes supplied on 'freight-pass-through' terms, where a price that is different from the RRP is used as the basis for calculating the supplier's charge to a reseller. To make it clear when such terms are being invoked, code 31 is used instead of code 01 to indicate the RRP. Code 32 is used for the 'billing price'.
+   Freight-pass-through billing price excluding tax – When freight-pass-through terms apply, the price on which the supplier's charge to a reseller is calculated, ie the price to which trade discount terms are applied. See also code 31.
+
+ Price type qualifier
+   Member/subscriber price – Price applies to a designated group membership
+   Export price – Price applies to sales outside the territory in which the supplier is located
+   Reduced price applicable when the item is purchased as part of a set – Use in cases where there is no combined set price, but a lower price is offered for each part if the whole set is purchased
+   Voucher price – In the Netherlands (or any other market where similar arrangements exist): a reduced fixed price available for a limited time on presentation of a voucher published in a specified medium, eg a newspaper. Should be accompanied by <PriceTypeCode> 13 and additional detail in <PriceTypeDescription>, and by validity dates in <PriceEffectiveFrom> and <PriceEffectiveUntil>.
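
The Voucher price note above encodes a concrete constraint: a price qualified as a voucher price should carry <PriceTypeCode> 13, a description, and effective-from/until dates. A minimal sketch of that check, assuming a flat dict whose keys merely mirror the ONIX element names (the record shape itself is an assumption):

    def check_voucher_price(price):
        # 'price' is a dict for a price already qualified as a voucher price.
        problems = []
        if price.get('PriceTypeCode') != '13':
            problems.append('voucher prices should carry PriceTypeCode 13')
        for key in ('PriceTypeDescription', 'PriceEffectiveFrom', 'PriceEffectiveUntil'):
            if not price.get(key):
                problems.append('missing %s' % key)
        return problems

    check_voucher_price({'PriceTypeCode': '13', 'PriceTypeDescription': 'newspaper voucher offer'})
    # -> ['missing PriceEffectiveFrom', 'missing PriceEffectiveUntil']
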
+ + + + + + + Unit of pricing code + + + + + Per copy of whole product + Default + + + + + Per page for printed loose-leaf content only + + + + + + + + Price status code + + + + + Unspecified + Default + + + + + Provisional + + + + + + Firm + + + + + + + + Tax rate, coded + + + + + Higher rate + Specifies that tax is applied at a higher rate than standard + + + + + Lower rate + Specifies that tax is applied at a lower rate than standard + + + + + Standard rate + + + + + + Zero-rated + + + + + + + + Intermediary supplier availability + + + + + + Publishing status + + + + + Unspecified + Status is not specified (as distinct from unknown): the default if the <PublishingStatus> element is not sent. Also to be used in applications where the element is considered mandatory, but the sender of the ONIX message chooses not to pass on status information. + + + + + Cancelled + The product was announced, and subsequently abandoned; the <PublicationDate> element must not be sent. + + + + + Forthcoming + Not yet published, must be accompanied by expected date in <PublicationDate>. + + + + + Postponed indefinitely + The product was announced, and subsequently postponed with no expected publication date; the<Publication Date> element must not be sent. + + + + + Active + The product was published, and is still active in the sense that the publisher will accept orders for it, though it may or may not be immediately available, for which see <SupplyDetail>. + + + + + No longer our product + Ownership of the product has been transferred to another publisher (with details of acquiring publisher if possible in PR.19). + + + + + Out of stock indefinitely + The product was active, but is now inactive in the sense that (a) the publisher will not accept orders for it, though stock may still be available elsewhere in the supply chain, and (b) there are no current plans to bring it back into stock. Code 06 does not specifically imply that returns are or are not still accepted. + + + + + Out of print + The product was active, but is now permanently inactive in the sense that (a) the publisher will not accept orders for it, though stock may still be available elsewhere in the supply chain, and (b) the product will not be made available again under the same ISBN. Code 07 normally implies that the publisher will not accept returns beyond a specified date. + + + + + Inactive + The product was active, but is now permanently or indefinitely inactive in the sense that the publisher will not accept orders for it, though stock may still be available elsewhere in the supply chain. Code 08 covers both of codes 06 and 07, and may be used where the distinction between those values is either unnecessary or meaningless. + + + + + Unknown + The sender of the ONIX record does not know the current publishing status. + + + + + Remaindered + The product is no longer available from the current publisher, under the current ISBN, at the current price. It may be available to be traded through another channel. A Publishing Status code 10 'Remaindered' usually but not always means that the publisher has decided to sell off excess inventory of the book. Copies of books that are remaindered are often made available in the supply chain at a reduced price. However, such remainders are often sold under a product identifier that differs from the ISBN on the full-priced copy of the book. 
A Publishing Status code 10 'Remaindered' on a given product record may or may not be followed by a Publishing Status code 06 'Out of Stock Indefinitely' or 07 'Out of Print': the practise varies from one publisher to another. Some publishers may revert to a Publishing Status code 04 “Active” if a desired inventory level on the product in question has subsequently been reached. No change in rights should ever be inferred from this (or any other) Publishing Status code value. + + + + + + + Product availability + + + + + Cancelled + Cancelled: product was announced, and subsequently abandoned + + + + + Not yet available + Not yet available (requires <ExpectedShipDate>, except in exceptional circumstances where no date is known) + + + + + Awaiting stock + Not yet available, but will be a stock item when available (requires <ExpectedShipDate>, except in exceptional circumstances where no date is known). Used particularly for imports which have been published in the country of origin but have not yet arrived in the importing country. + + + + + Not yet available, will be POD + Not yet available, to be published as print-on-demand only. May apply either to a POD successor to an existing conventional edition, when the successor will be published under a different ISBN (normally because different trade terms apply); or to a title that is being published as a POD original. + + + + + Available + Available from us (form of availability unspecified) + + + + + In stock + Available from us as a stock item + + + + + To order + Available from us as a non-stock item, by special order + + + + + Manufactured on demand + Available from us by manufacture on demand + + + + + Temporarily unavailable + Temporarily unavailable: temporarily unavailable from us (reason unspecified) (requires <ExpectedShipDate>, except in exceptional circumstances where no date is known) + + + + + Out of stock + Stock item, temporarily out of stock (requires <ExpectedShipDate>, except in exceptional circumstances where no date is known) + + + + + Reprinting + Temporarily unavailable, reprinting (requires <ExpectedShipDate>, except in exceptional circumstances where no date is known) + + + + + Awaiting reissue + Temporarily unavailable, awaiting reissue (requires the <Reissue> composite, and <ExpectedShipDate>, except in exceptional circumstances where no date is known) + + + + + Not available + Not available from us (reason unspecified; if the reason is rights-related, it should be specified in PR.21) + + + + + Replaced by new product + This product is unavailable, but a successor product or edition is or will be available from us (identify successor in <RelatedProduct>) + + + + + Other format available + This product is unavailable, but the same content is or will be available from us in an alternative format (identify other format product in <RelatedProduct>) + + + + + No longer supplied by us + Identify new supplier in <NewSupplier> if possible + + + + + Apply direct + Not available to trade, apply direct to publisher + + + + + Not sold separately + Must be bought as part of a set (identify set in <RelatedProduct>) + + + + + Withdrawn from sale + May be for legal reasons or to avoid giving offence + + + + + Remaindered + Remaindered + + + + + Out of print, replaced by POD + Out of print, but a print-on-demand edition is or will be available under a different ISBN. Use only when the POD successor has a different ISBN, normally because different trade terms apply. 
+ + + + + Uncertain + Apply to customer service + + + + + + + BISAC returnable indicator + + + + + Yes, returnable, full copies only + + + + + + No, not returnable + + + + + + Conditional + Contact publisher for requirements and/or authorization + + + + + Yes, returnable, stripped cover + + + + + + + + Market date role + + + + + Local publication date + The date on which the product is expected to be first published in this market, or – after publication – the date on which it was published in this market. There may or may not be a strict embargo on retail sales before the expected date; if there is, it should be specified separately as an embargo date. + + + + + Consumer on sale date / embargo date + If there is an embargo on retail sales in this market before a certain date, the date from which the embargo is lifted and retail sales are permitted + + + + + + + Market publishing status + + + + + Unspecified + Status is not specified (as distinct from unknown): the default if the <MarketPublishingStatus> element is not sent. + + + + + Cancelled + The product was announced for publication in this market, and subsequently abandoned. + + + + + Forthcoming + Not yet published in this market, should be accompanied by expected local publication date.. + + + + + Postponed indefinitely + The product was announced for publication in this market, and subsequently postponed with no expected local publication date. + + + + + Active + The product was published in this market, and is still active in the sense that the publisher will accept orders for it, though it may or may not be immediately available, for which see <SupplyDetail>. + + + + + No longer our product + Responsibility for the product in this market has been transferred elsewhere. + + + + + Out of stock indefinitely + The product was active, but is now inactive in the sense that (a) no further stock is expected to be made available in this market, though stock may still be available elsewhere in the supply chain, and (b) there are no current plans to bring it back into stock. + + + + + Out of print + The product was active, but is now permanently inactive in the sense that (a) no further stock is expected to be made available in this market, though stock may still be available elsewhere in the supply chain, and (b) the product will not be made available again under the same ISBN. + + + + + Inactive + The product was active, but is now permanently or indefinitely inactive in the sense that no further stock is expected to be made available in this market, though stock may still be available elsewhere in the supply chain. Code 08 covers both of codes 06 and 07, and may be used where the distinction between those values is either unnecessary or meaningless. + + + + + Unknown + The sender of the ONIX record does not know the current publishing status in this market. + + + + + Remaindered + The product is no longer available in this market from the local publisher, under the current ISBN, at the current price. It may be available to be traded through another channel, usually at a reduced price. 
+ + + + + Withdrawn from sale + Withdrawn from sale in this market, typically for legal reasons + + + + + Not available in this market + Either no rights are held for the product in this market, or for other reasons the publisher has decided not to make it available in this market + + + + + Active, but not sold separately + The product is published in this market and active but, as a publishing decision, it is not sold separately – only in an assembly or as part of a package + + + + + Active, with market restrictions + The product is published in this market and active, but is not available to all customer types, typically because the market is split between exclusive sales agents for different market segments. Should be accompanied by a free-text statement in <MarketRestrictionDetail> describing the nature of the restriction. + + + + + + + Agent role + + + + + Exclusive sales agent + Publisher's exclusive sales agent in a specified territory + + + + + Non-exclusive sales agent + Publisher's non-exclusive sales agent in a specified territory + + + + + Local publisher + Publisher for a specified territory + + + + + + + Stock quantity code type + + + + + Proprietary + + + + + + APA stock quantity code + Code scheme defined by the Australian Publishers Association + + + + + + + Sales restriction type code + + + + + Unspecified - see text + Restriction must be described in <SalesRestrictionDetail> + + + + + Retailer exclusive / own brand + For sale only through designated retailer. Retailer must be named in <SalesOutletName>. Use only when it is not possible to assign the more explicit code 04 or 05. + + + + + Office supplies edition + For editions sold only though office supplies wholesalers. Retailer(s) and/or distributor(s) may be named in <SalesOutletName> + + + + + Internal publisher use only: do not list + For an ISBN that is assigned for a publisher's internal purposes + + + + + Retailer exclusive + For sale only through designated retailer, though not under retailer's own brand/imprint. Retailer must be named in <SalesOutletName>. + + + + + Retailer own brand + For sale only through designated retailer under retailer's own brand/imprint. Retailer must be named in <SalesOutletName>. + + + + + Library edition + For sale to libraries only; not for sale through retail trade + + + + + + + Thesis type code + + + + + Habilitationsschrift + Professorial dissertation (thesis for postdoctoral lecturing qualification) + + + + + Dissertationsschrift + Doctoral thesis + + + + + Staatsexamensarbeit + State examination thesis + + + + + Magisterarbeit + Masters degree thesis + + + + + Diplomarbeit + Diploma thesis + + + + + + + Website role + + + + + Unspecified, see website description + + + + + + Publisher’s corporate website + See also codes 17 and 18 + + + + + Publisher’s website for a specified work + A publisher’s informative and/or promotional webpage relating to a specified work (book, journal, online resource or other publication type) + + + + + Online hosting service home page + A webpage giving access to an online content hosting service as a whole + + + + + Journal home page + A webpage giving general information about a journal title, in print or electronic format or both. + + + + + Online journal 'available contents' page + A webpage giving direct access to the content that is available online for a specified journal title version. 
+ + + + + Contributor’s own website + A webpage maintained by an author or other contributor about her/his publications and personal background + + + + + Publisher’s website relating to specified contributor + A publisher’s webpage devoted to a specific author or other contributor + + + + + Other publisher’s website relating to specified contributor + A webpage devoted to a specific author or other contributor, and maintained by a publisher other than the publisher of the item described in the ONIX record + + + + + Third-party website relating to specified contributor + A webpage devoted to a specific author or other contributor, and maintained by a third party (eg a fan site) + + + + + Contributor’s own website for specified work + A webpage maintained by an author or other contributor and specific to an individual work + + + + + Other publisher’s website relating to specified work + A webpage devoted to an individual work, and maintained by a publisher other than the publisher of the item described in the ONIX record + + + + + Third-party website relating to specified work + A webpage devoted to an individual work, and maintained by a third party (eg a fan site) + + + + + Contributor’s own website for group or series of works + A webpage maintained by an author or other contributor and specific to a group or series of works + + + + + Publisher’s website relating to group or series of works + A publisher’s webpage devoted to a group or series of works + + + + + Other publisher’s website relating to group or series of works + A webpage devoted to a group or series of works, and maintained by a publisher other than the publisher of the item described in the ONIX record + + + + + Third-party website relating to group or series of works (eg a fan site) + A webpage devoted to a group or series of works, and maintained by a third party (eg a fan site) + + + + + Publisher’s B2B website + Use instead of code 01 to specify a publisher’s website for trade users + + + + + Publisher’s B2C website + Use instead of code 01 to specify a publisher’s website for consumers + + + + + + + Language code - ISO 639-2/B + + + + + Afar + + + + + + Abkhaz + + + + + + Achinese + + + + + + Acoli + + + + + + Adangme + + + + + + Adygei + + + + + + Afroasiatic (Other) + + + + + + Afrihili (Artificial language) + + + + + + Afrikaans + + + + + + Ainu + + + + + + Akan + + + + + + Akkadian + + + + + + Albanian + + + + + + Aleut + + + + + + Algonquian (Other) + + + + + + Southern Altai + + + + + + Amharic + + + + + + English, Old (ca. 
450-1100) + + + + + + Apache languages + + + + + + Arabic + + + + + + Aramaic + + + + + + Aragonese Spanish + + + + + + Armenian + + + + + + Mapuche + + + + + + Arapaho + + + + + + Artificial (Other) + + + + + + Arawak + + + + + + Assamese + + + + + + Bable + + + + + + Athapascan (Other) + + + + + + Australian languages + + + + + + Avaric + + + + + + Avestan + + + + + + Awadhi + + + + + + Aymara + + + + + + Azerbaijani + + + + + + Banda + + + + + + Bamileke languages + + + + + + Bashkir + + + + + + Baluchi + + + + + + Bambara + + + + + + Balinese + + + + + + Basque + + + + + + Basa + + + + + + Baltic (Other) + + + + + + Beja + + + + + + Belarusian + + + + + + Bemba + + + + + + Bengali + + + + + + Berber (Other) + + + + + + Bhojpuri + + + + + + Bihari + + + + + + Bikol + + + + + + Bini + + + + + + Bislama + + + + + + Siksika + + + + + + Bantu (Other) + + + + + + Bosnian + + + + + + Braj + + + + + + Breton + + + + + + Batak + + + + + + Buriat + + + + + + Bugis + + + + + + Bulgarian + + + + + + Burmese + + + + + + Blin; Bilin + + + + + + Caddo + + + + + + Central American Indian (Other) + + + + + + Carib + + + + + + Catalan + + + + + + Caucasian (Other) + + + + + + Cebuano + + + + + + Celtic (Other) + + + + + + Chamorro + + + + + + Chibcha + + + + + + Chechen + + + + + + Chagatai + + + + + + Chinese + + + + + + Truk + + + + + + Mari + + + + + + Chinook jargon + + + + + + Choctaw + + + + + + Chipewyan + + + + + + Cherokee + + + + + + Church Slavic + + + + + + Chuvash + + + + + + Cheyenne + + + + + + Chamic languages + + + + + + Coptic + + + + + + Cornish + + + + + + Corsican + + + + + + Creoles and Pidgins, English-based (Other) + + + + + + Creoles and Pidgins, French-based (Other) + + + + + + Creoles and Pidgins, Portuguese-based (Other) + + + + + + Cree + + + + + + Crimean Turkish; Crimean Tatar + + + + + + Creoles and Pidgins (Other) + + + + + + Kashubian + + + + + + Cushitic (Other) + + + + + + Czech + + + + + + Dakota + + + + + + Danish + + + + + + Dargwa + + + + + + Dayak + + + + + + Delaware + + + + + + Slave + + + + + + Dogrib + + + + + + Dinka + + + + + + Divehi + + + + + + Dogri + + + + + + Dravidian (Other) + + + + + + Lower Sorbian + + + + + + Duala + + + + + + Dutch, Middle (ca. 1050-1350) + + + + + + Dutch + + + + + + Dyula + + + + + + Dzongkha + + + + + + Efik + + + + + + Egyptian + + + + + + Ekajuk + + + + + + Elamite + + + + + + English + + + + + + English, Middle (1100-1500) + + + + + + Esperanto + + + + + + Estonian + + + + + + Ewe + + + + + + Ewondo + + + + + + Fang + + + + + + Faroese + + + + + + Fanti + + + + + + Fijian + + + + + + Filipino; Pilipino + + + + + + Finnish + + + + + + Finno-Ugrian (Other) + + + + + + Fon + + + + + + French + + + + + + French, Middle (ca. 1400-1600) + + + + + + French, Old (ca. 842-1400) + + + + + + Frisian + + + + + + Fula + + + + + + Friulian + + + + + + + + + + + + Gayo + + + + + + Gbaya + + + + + + Germanic (Other) + + + + + + Georgian + + + + + + German + + + + + + Ethiopic + + + + + + Gilbertese + + + + + + Scottish Gaelic + + + + + + Irish + + + + + + Galician + + + + + + Manx + + + + + + German, Middle High (ca. 1050-1500) + + + + + + German, Old High (ca. 
750-1050) + + + + + + Gondi + + + + + + Gorontalo + + + + + + Gothic + + + + + + Grebo + + + + + + Greek, Ancient (to 1453) + + + + + + Greek, Modern (1453-) + + + + + + Guarani + + + + + + Gujarati + + + + + + Gwich'in + + + + + + Haida + + + + + + Haitian French Creole + + + + + + Hausa + + + + + + Hawaiian + + + + + + Hebrew + + + + + + Herero + + + + + + Hiligaynon + + + + + + Himachali + + + + + + Hindi + + + + + + Hittite + + + + + + Hmong + + + + + + Hiri Motu + + + + + + Upper Sorbian + + + + + + Hungarian + + + + + + Hupa + + + + + + Iban + + + + + + Igbo + + + + + + Icelandic + + + + + + Ido + + + + + + Sichuan Yi + + + + + + Ijo + + + + + + Inuktitut + + + + + + Interlingue + + + + + + Iloko + + + + + + Interlingua (International Auxiliary Language Association) + + + + + + Indic (Other) + + + + + + Indonesian + + + + + + Indo-European (Other) + + + + + + Ingush + + + + + + Inupiaq + + + + + + Iranian (Other) + + + + + + Iroquoian (Other) + + + + + + Italian + + + + + + Javanese + + + + + + Lojban + + + + + + Japanese + + + + + + Judeo-Persian + + + + + + Judeo-Arabic + + + + + + Kara-Kalpak + + + + + + Kabyle + + + + + + Kachin + + + + + + Kalâtdlisut + + + + + + Kamba + + + + + + Kannada + + + + + + Karen + + + + + + Kashmiri + + + + + + Kanuri + + + + + + Kawi + + + + + + Kazakh + + + + + + Kabardian + + + + + + Khasi + + + + + + Khoisan (Other) + + + + + + Khmer + + + + + + Khotanese + + + + + + Kikuyu + + + + + + Kinyarwanda + + + + + + Kyrgyz + + + + + + Kimbundu + + + + + + Konkani + + + + + + Komi + + + + + + Kongo + + + + + + Korean + + + + + + Kusaie + + + + + + Kpelle + + + + + + Karachay-Balkar + + + + + + Kru + + + + + + Kurukh + + + + + + Kuanyama + + + + + + Kumyk + + + + + + Kurdish + + + + + + Kutenai + + + + + + Ladino + + + + + + Lahnda + + + + + + Lamba + + + + + + Lao + + + + + + Latin + + + + + + Latvian + + + + + + Lezgian + + + + + + Limburgish + + + + + + Lingala + + + + + + Lithuanian + + + + + + Mongo-Nkundu + + + + + + Lozi + + + + + + Letzeburgesch + + + + + + Luba-Lulua + + + + + + Luba-Katanga + + + + + + Ganda + + + + + + Luiseño + + + + + + Lunda + + + + + + Luo (Kenya and Tanzania) + + + + + + Lushai + + + + + + Macedonian + + + + + + Madurese + + + + + + Magahi + + + + + + Marshall + + + + + + Maithili + + + + + + Makasar + + + + + + Malayalam + + + + + + Mandingo + + + + + + Maori + + + + + + Austronesian (Other) + + + + + + Marathi + + + + + + Masai + + + + + + Malay + + + + + + Moksha + + + + + + Mandar + + + + + + Mende + + + + + + Irish, Middle (ca. 
1100-1550) + + + + + + Micmac + + + + + + Minangkabau + + + + + + Miscellaneous languages + + + + + + Mon-Khmer (Other) + + + + + + Malagasy + + + + + + Maltese + + + + + + Manchu + + + + + + Manipuri + + + + + + Manobo languages + + + + + + Mohawk + + + + + + Moldavian + + + + + + Mongolian + + + + + + Mooré + + + + + + Multiple languages + + + + + + Munda (Other) + + + + + + Creek + + + + + + Mirandese + + + + + + Marwari + + + + + + Mayan languages + + + + + + Erzya + + + + + + Nahuatl + + + + + + North American Indian (Other) + + + + + + Neapolitan Italian + + + + + + Nauru + + + + + + Navajo + + + + + + Ndebele (South Africa) + + + + + + Ndebele (Zimbabwe) + + + + + + Ndonga + + + + + + Low German + + + + + + Nepali + + + + + + Newari + + + + + + Nias + + + + + + Niger-Kordofanian (Other) + + + + + + Niuean + + + + + + Norwegian Nynorsk + + + + + + Norwegian Bokmål + + + + + + Nogai + + + + + + Old Norse + + + + + + Norwegian + + + + + + Northern Sotho + + + + + + Nubian languages + + + + + + Classical Newari; Old Newari + + + + + + Nyanja + + + + + + Nyamwezi + + + + + + Nyankole + + + + + + Nyoro + + + + + + Nzima + + + + + + Occitan (post-1500) + + + + + + Ojibwa + + + + + + Oriya + + + + + + Oromo + + + + + + Osage + + + + + + Ossetic + + + + + + Turkish, Ottoman + + + + + + Otomian languages + + + + + + Papuan (Other) + + + + + + Pangasinan + + + + + + Pahlavi + + + + + + Pampanga + + + + + + Panjabi + + + + + + Papiamento + + + + + + Palauan + + + + + + Old Persian (ca. 600-400 B.C.) + + + + + + Persian + + + + + + Philippine (Other) + + + + + + Phoenician + + + + + + Pali + + + + + + Polish + + + + + + Ponape + + + + + + Portuguese + + + + + + Prakrit languages + + + + + + Provençal (to 1500) + + + + + + Pushto + + + + + + Aranés + ONIX local code + + + + + Valencian + ONIX local code + + + + + Quechua + + + + + + Rajasthani + + + + + + Rapanui + + + + + + Rarotongan + + + + + + Romance (Other) + + + + + + Raeto-Romance + + + + + + Romany + + + + + + Romanian + + + + + + Rundi + + + + + + Aromanian; Arumanian; Macedo-Romanian + + + + + + Russian + + + + + + Sandawe + + + + + + Sango + + + + + + Yakut + + + + + + South American Indian (Other) + + + + + + Salishan languages + + + + + + Samaritan Aramaic + + + + + + Sanskrit + + + + + + Sasak + + + + + + Santali + + + + + + Serbian + + + + + + Sicilian + + + + + + Scots + + + + + + Croatian + + + + + + Selkup + + + + + + Semitic (Other) + + + + + + Irish, Old (to 1100) + + + + + + Sign languages + + + + + + Shan + + + + + + Sidamo + + + + + + Sinhalese + + + + + + Siouan (Other) + + + + + + Sino-Tibetan (Other) + + + + + + Slavic (Other) + + + + + + Slovak + + + + + + Slovenian + + + + + + Southern Sami + + + + + + Northern Sami + + + + + + Sami + + + + + + Lule Sami + + + + + + Inari Sami + + + + + + Samoan + + + + + + Skolt Sami + + + + + + Shona + + + + + + Sindhi + + + + + + Soninke + + + + + + Sogdian + + + + + + Somali + + + + + + Songhai + + + + + + Sotho + + + + + + Spanish + + + + + + Sardinian + + + + + + Serer + + + + + + Nilo-Saharan (Other) + + + + + + Swazi + + + + + + Sukuma + + + + + + Sundanese + + + + + + Susu + + + + + + Sumerian + + + + + + Swahili + + + + + + Swedish + + + + + + Syriac + + + + + + Tahitian + + + + + + Tai (Other) + + + + + + Tamil + + + + + + Tatar + + + + + + Telugu + + + + + + Temne + + + + + + Terena + + + + + + Tetum + + + + + + Tajik + + + + + + Tagalog + + + + + + Thai + + + + + + Tibetan + + + + + + Tigré + + + + + + Tigrinya + + + + + + Tiv + + + + + + Tokelauan + + + + + + Klingon; 
tlhIngan-Hol + + + + + + Tlingit + + + + + + Tamashek + + + + + + Tonga (Nyasa) + + + + + + Tongan + + + + + + Tok Pisin + + + + + + Tsimshian + + + + + + Tswana + + + + + + Tsonga + + + + + + Turkmen + + + + + + Tumbuka + + + + + + Tupi languages + + + + + + Turkish + + + + + + Altaic (Other) + + + + + + Tuvaluan + + + + + + Twi + + + + + + Tuvinian + + + + + + Udmurt + + + + + + Ugaritic + + + + + + Uighur + + + + + + Ukrainian + + + + + + Umbundu + + + + + + Undetermined + + + + + + Urdu + + + + + + Uzbek + + + + + + Vai + + + + + + Venda + + + + + + Vietnamese + + + + + + Volapük + + + + + + Votic + + + + + + Wakashan languages + + + + + + Walamo + + + + + + Waray + + + + + + Washo + + + + + + Welsh + + + + + + Sorbian languages + + + + + + Walloon + + + + + + Wolof + + + + + + Kalmyk + + + + + + Xhosa + + + + + + Yao + + + + + + Yapese + + + + + + Yiddish + + + + + + Yoruba + + + + + + Yupik languages + + + + + + Zapotec + + + + + + Zenaga + + + + + + Zhuang + + + + + + Zande + + + + + + Zulu + + + + + + Zuni + + + + + + + + Person date role + + + + + Date of birth + + + + + + Date of death + + + + + + + + Product form feature value - DVD region codes + + + + + All regions + + + + + + US & Canada + US, US Territories, Canada + + + + + Japan, Europe, S Africa, Middle East + Japan, Europe, South Africa and Middle East (including Egypt) + + + + + SE Asia and East Asia + Southeast Asia and East Asia (including Hong Kong) + + + + + Australia, NZ, Pacific Islands, Central America, Mexico, South America, Caribbean + Australia, New Zealand, Pacific Islands, Central America, Mexico, South America and the Caribbean + + + + + Eastern Europe, Indian subcontinent, Africa, North Korea, Mongolia + Eastern Europe (former Soviet Union), Indian subcontinent, Africa, North Korea and Mongolia + + + + + China + + + + + + Reserved + + + + + + Special international venues + Planes, cruise ships etc + + + + + + + US school or college grade + + + + + Preschool + Age typically 0-4 years + + + + + Kindergarten + Age typically 5 years + + + + + First Grade + Age typically 6 years + + + + + Second Grade + Age typically 7 years + + + + + Third Grade + Age typically 8 years + + + + + Fourth Grade + Age typically 9 years + + + + + Fifth Grade + Age typically 10 years + + + + + Sixth Grade + Age typically 11 years + + + + + Seventh Grade + Age typically 12 years + + + + + Eighth Grade + Age typically 13 years + + + + + Ninth Grade + High School Freshman - age typically 14 years + + + + + Tenth Grade + High School Sophomore - age typically 15 years + + + + + Eleventh Grade + High School Junior - age typically 16 years + + + + + Twelfth Grade + High School Senior - age typically 17 years + + + + + College Freshman + Age typically 18 years + + + + + College Sophomore + Age typically 19 years + + + + + College Junior + Age typically 20 years + + + + + College Senior + Age typically 21 years + + + + + College Graduate Student + Age typically 22+ years + + + + + + + Product form detail + + + + + CD standard audio format + CD 'red book' format + + + + + SACD super audio format + + + + + + MP3 format + + + + + + WAV format + + + + + + Real Audio format + + + + + + Mass market (rack) paperback + In North America, a category of paperback characterized partly by page size (typically 4¼ x 7 1/8 inches) and partly by target market and terms of trade. Use with Product Form code BC. 
+ + + + + Trade paperback (US) + In North America, a category of paperback characterized partly by page size and partly by target market and terms of trade. AKA 'quality paperback', and including textbooks. Most paperback books sold in North America except 'mass-market' (B101) and 'tall rack' (B107) are correctly described with this code. Use with Product Form code BC. + + + + + Digest format paperback + In North America, a category of paperback characterized by page size and generally used for children's books; use with Product Form code BC. Note: was wrongly shown as B102 (duplicate entry) in Issue 3. + + + + + A-format paperback + In UK, a category of paperback characterized by page size (normally 178 x 111 mm approx); use with Product Form code BC + + + + + B-format paperback + In UK, a category of paperback characterized by page size (normally 198 x 129 mm approx); use with Product Form code BC + + + + + Trade paperback (UK) + In UK, a category of paperback characterized partly by size (usually in traditional hardback dimensions), and often used for paperback originals; use with Product Form code BC (replaces 'C-format' from former List 8) + + + + + Tall rack paperback (US) + In North America, a category of paperback characterised partly by page size and partly by target market and terms of trade; use with Product Form code BC + + + + + A5: Tankobon + Japanese hardcover format + + + + + B5: Tankobon + Japanese hardcover format + + + + + B6: Tankobon + Japanese hardcover format + + + + + A6: Bunko + Japanese paperback format + + + + + B40-dori: Shinsho + Japanese paperback format + + + + + Coloring / join-the-dot book + + + + + + Lift-the-flap book + + + + + + Fuzzy book + + + + + + Miniature book + Note: was wrongly shown as B203 (duplicate entry) in Issue 3 + + + + + Moving picture / flicker book + + + + + + Pop-up book + + + + + + Scented / 'smelly' book + + + + + + Sound story / 'noisy' book + + + + + + Sticker book + + + + + + Touch-and-feel book + Incorporating different textures + + + + + Toy / die-cut book + Cut in a non-standard shape with moving parts or other features that make it function as a toy as well as a book: use with Product Form BK + + + + + Picture book + Children's picture book: use with applicable Product Form code + + + + + Loose leaf - sheets & binder + Use with Product Form code BD + + + + + Loose leaf - binder only + Use with Product Form code BD + + + + + Loose leaf - sheets only + Use with Product Form code BD + + + + + Sewn + AKA stitched; for 'saddle-sewn', see code B310 + + + + + Unsewn / adhesive bound + Including 'perfect bound', 'glued' + + + + + Library binding + Strengthened binding intended for libraries + + + + + Reinforced binding + Strengthened binding, not specifically intended for libraries + + + + + Half bound + Must be accompanied by a code specifiying a material, eg 'half-bound real leather' + + + + + Quarter bound + Must be accompanied by a code specifiying a material, eg 'quarter bound real leather' + + + + + Saddle-sewn + AKA 'saddle-stitched' or 'wire-stitched' + + + + + Comb bound + Round or oval plastic forms in a clamp-like configuration: use with code BE from List 7 + + + + + Wire-O + Twin loop metal or plastic spine: use with code BE from List 7 + + + + + Concealed wire + Cased over Wire-O binding: use with code BE from List 7 + + + + + Cloth over boards + AKA fabric, linen over boards + + + + + Paper over boards + + + + + + Leather, real + + + + + + Leather, imitation + + + + + + Leather, bonded + + + + + + Vellum + + + + + + 
Plastic + + + + + + Vinyl + + + + + + Cloth + Cloth, not necessarily over boards – cf B401 + + + + + Imitation cloth + Spanish 'simil-tela' + + + + + With dust jacket + Type unspecified + + + + + With printed dust jacket + Used to distinguish from B503 + + + + + With translucent dust cover + With translucent paper or plastic protective cover + + + + + With flaps + For paperback with flaps + + + + + With thumb index + + + + + + With ribbon marker(s) + If the number of markers is significant, it can be stated as free text in <ProductFormDescription> + + + + + With zip fastener + + + + + + With button snap fastener + + + + + + With leather edge lining + AKA yapp edge? + + + + + Real Video format + + + + + + Quicktime format + + + + + + AVI format + + + + + + Windows Media format + + + + + + MPEG-4 + + + + + + MS-DOS + Use with an applicable Product Form code D* + + + + + Windows + Use with an applicable Product Form code D* + + + + + Macintosh + Use with an applicable Product Form code D* + + + + + UNIX / LINUX + Use with an applicable Product Form code D* + + + + + Other operating system(s) + Use with an applicable Product Form code D* + + + + + Palm OS + Use with an applicable Product Form code D* + + + + + Windows Mobile + Use with an applicable Product Form code D* + + + + + Microsoft XBox + Use with Product Form code DE or DB as applicable + + + + + Nintendo Gameboy Color + Use with Product Form code DE or DB as applicable + + + + + Nintendo Gameboy Advanced + Use with Product Form code DE or DB as applicable + + + + + Nintendo Gameboy + Use with Product Form code DE or DB as applicable + + + + + Nintendo Gamecube + Use with Product Form code DE or DB as applicable + + + + + Nintendo 64 + Use with Product Form code DE or DB as applicable + + + + + Sega Dreamcast + Use with Product Form code DE or DB as applicable + + + + + Sega Genesis/Megadrive + Use with Product Form code DE or DB as applicable + + + + + Sega Saturn + Use with Product Form code DE or DB as applicable + + + + + Sony Playstation 1 + Use with Product Form code DE or DB as applicable + + + + + Sony Playstation 2 + Use with Product Form code DE or DB as applicable + + + + + Nintendo Dual Screen + + + + + + Desk calendar + Use with Product Form code PC + + + + + Mini calendar + Use with Product Form code PC + + + + + Engagement calendar + Use with Product Form code PC + + + + + Day by day calendar + Use with Product Form code PC + + + + + Poster calendar + Use with Product Form code PC + + + + + Wall calendar + Use with Product Form code PC + + + + + Perpetual calendar + Use with Product Form code PC + + + + + Advent calendar + Use with Product Form code PC + + + + + PAL + TV standard for video or DVD + + + + + NTSC + TV standard for video or DVD + + + + + SECAM + TV standard for video or DVD + + + + + + + Product form feature type + + + + + Color of cover + For Product Form Feature values see code list 98 + + + + + Color of page edge + For Product Form Feature values see code list 98 + + + + + Text font + The principal font used for body text, when this is a significant aspect of product description, eg for some Bibles. The accompanying Product Form Feature value is text specifying font size and, if desired, style. 
+ + + + + Special cover material + For Product Form Feature values see code list 99 + + + + + DVD region + For Product Form Feature values see code list 76 + + + + + + + Product packaging type + + + + + Slip-sleeve + + + + + + Clamshell + + + + + + Keep case + + + + + + Jewel case + + + + + + In box + Individual item or set in box with lid: not to be confused with the commonly-used 'boxed set' - see below + + + + + Slip-cased + Slip-case for single item only: German 'Schuber' + + + + + Slip-cased set + Slip-case for multi-volume set: German 'Kassette'; also commonly referred to as 'boxed set' + + + + + Tube + Rolled in tube: sheet map or poster + + + + + Binder + Use for miscellaneous items such as slides, microfiche, when presented in a binder + + + + + In wallet or folder + Use for miscellaneous items such as slides, microfiche, when presented in a wallet or folder + + + + + + + Product content type + + + + + Audiobook + Audio recording of a reading of a book or other text + + + + + Performance - spoken word + Audio recording of a drama or other spoken word performance + + + + + Music recording + Audio recording of a music performance, including musical drama and opera + + + + + Other audio + Audio recording of other sound, eg birdsong + + + + + Game + + + + + + Moving images + Film, video etc + + + + + Still images / graphics + + + + + + Software + + + + + + Data + Data files + + + + + + + Bible contents + + + + + Apocrypha + The seven portions of the Apocrypha added to the Catholic canon at the Council of Trent in 1546: Tobit; Judith; Wisdom of Solomon; Sirach (Ecclesiasticus); Baruch, including the Letter of Jeremiah; I & II Maccabees; Extra portions of Esther and Daniel (Additions to Esther; the Prayer of Azariah; Song of the Three Jews; Susannah; Bel and the Dragon). These are not generally included in the Protestant canon. + + + + + Additional Apocryphal texts: Greek Orthodox canon + I Esdras; Prayer of Manasseh; Psalm 151; III Maccabees. + + + + + Additional Apocryphal texts: Slavonic Orthodox canon + I & II Esdras; Prayer of Manasseh; Psalm 151; III & IV Maccabees. + + + + + Additional Apocryphal texts + Additional Apocryphal texts included in some Bible versions: I & II Esdras; Prayer of Manasseh. + + + + + General canon with Apocrypha + The 66 books included in the Protestant, Catholic and Orthodox canons, together with the seven portions of the Apocrypha included in the Catholic canon. + + + + + General canon + The 66 books included in the Protestant, Catholic and Orthodox canons, 39 from the Old Testament and 27 from the New Testament. The sequence of books may differ in different canons. + + + + + Gospels + The books of Matthew, Mark, Luke and John. + + + + + Old Testament + Those 39 books which were included in the Jewish canon by the rabbinical academy established at Jamma in 90 CE. Also known as the Jewish or Hebrew scriptures. + + + + + New Testament + The 27 books included in the Christian canon through the Easter Letter of Athanasius, Bishop of Alexandria and also by a general council of the Christian church held near the end of the 4th century CE. + + + + + New Testament with Psalms and Proverbs + Includes the 27 books of the New Testament plus Psalms and Proverbs from the Old Testament. + + + + + Paul’s Epistles + The books containing the letters of Paul to the various early Christian churches. + + + + + Psalms and Proverbs + The book of Psalms and the book of Proverbs combined. + + + + + Psalms + The book of Psalms. 
+ + + + + Pentateuch + The first five books of the Bible: Genesis, Exodus, Numbers, Leviticus, Deuteronomy. Also applied to the Torah. + + + + + Other portions + Selected books of either the OT or NT not otherwise noted. + + + + + + + Bible version + + + + + Amplified + A translation based on the American Standard Version and showing multiple options for the translation of ancient text. Published in full in 1965. Sponsored by the Lockman Foundation. + + + + + American Standard + A 1901 translation using verbal equivalence techniques with the purpose of Americanizing the King James version. + + + + + Contemporary English + A translation completed in 1995 and sponsored by the American Bible Society under the leadership of Barclay Newman. + + + + + Douay-Rheims + An early (1580-1609) English translation from the Latin Vulgate designed for Catholics and performed by George Martin. + + + + + English Standard + An update of the Revised Standard Version that makes 'modest' use of gender-free terminology. + + + + + God’s Word + A 1995 translation by the World Bible Publishing Company using the English language in a manner to communicate to the late 20th century American. + + + + + Geneva + An early (1560) English version of the Bible translated by William Whittingham with strong Protestant leanings. + + + + + Good News + A translation sponsored by the American Bible Society. The New Testament was first published (as “Today’s English Version” TEV) in 1966. The Old Testament was completed in 1976, and the whole was published as the “Good News Bible”. + + + + + Original Greek + New Testament text in an original Greek version + + + + + Original Hebrew + Old Testament text in an original Hebrew version + + + + + Holman Christian Standard + Published by Broadman and Holman this translation rejects all forms of gender-neutral wording and is written with strong influences from the Southern Baptist perspective of biblical scholarship. + + + + + International Children’s + A translation completed in 1986 targeting readability at the US third grade level. + + + + + Jerusalem + A translation designed for English speaking Catholics based on the original languages. It is based on French as well as ancient texts and was first published in 1966. + + + + + King James + A translation commissioned by King James I of England and first published in 1611. + + + + + 21st Century King James + A verbal translation led by William Prindele. Published in 1994, it was designed to modernize the language of the King James Version based on Webster’s New International Dictionary, 2nd edition, unabridged. + + + + + Living Bible + A paraphrase translation led by Kenneth N Taylor and first published in 1972. + + + + + Message Bible + A paraphrase translation of the New Testament by Eugene Peterson first published in 1993. + + + + + New American + A translation aimed at Catholic readers first published in its entirely in 1970. A revised New Testament was issued in 1986. + + + + + New American Standard + A translation commissioned by the Lockman Foundation. The New Testament was published in 1960 followed by the entire Bible in 1971. + + + + + New American Standard, Updated + A 1995 translation using more modern language than the NASB. 
+ + + + + Bibelen 1895 + Norwegian Bible translation + + + + + Bibelen 1930 + Norwegian Bible translation + + + + + Bibelen 1938 + Norwegian Bible translation + + + + + Bibelen 1978-85 + Norwegian Bible translation + + + + + Bibelen 1978 + Norwegian Bible translation + + + + + Bibelen 1985 + Norwegian Bible translation + + + + + Bibelen 1988 + Norwegian Bible translation + + + + + Bibelen 1978-85/rev. 2005 + Norwegian Bible translation + + + + + New Century + A translation inspired by the International Children’s version. First published by World Publishing in 1991. + + + + + New English + A translation first issued in 1970 as a result of a proposal at the 1946 General Assembly of the Church of Scotland. + + + + + Bibelen Guds ord + Norwegian Bible translation + + + + + New International + A translation underwritten by the International Bible Society (formerly New York Bible Society). The New Testament was published in 1973 followed by the entire Bible in 1978. + + + + + New International Reader’s + A 1996 translation designed for people with limited literacy in English and based on the NIV. + + + + + New Jerusalem + A revision of the Jerusalem Bible. First published in 1986. + + + + + New King James + A version issued by Thomas Nelson Publishers in 1982-83 designed to update the language of the King James Version while maintaining the phrasing and rhythm and using the same sources as its predecessor. + + + + + Bibelen, nynorsk + Norwegian 'nynorsk' Bible translation + + + + + New Living + A translation sponsored by Tyndale House and first released in 1996. It is considered a revision and updating of the Living Bible. + + + + + New Revised Standard + A revision of the Revised Standard based on ancient texts but updating language to American usage of the 1980s. + + + + + Nueva Version Internacional + A Spanish translation underwritten by the International Bible Society. + + + + + New Testament in Modern English (Phillips) + An idiomatic translation by J B Phillips, first completed in 1966 + + + + + Revised English + A 1989 revision of the NEB. A significant effort was made to reduce the British flavor present in the NEB. + + + + + Revised Version + The first major revision of the King James Version, the Revised Version incorporates insights from early manuscripts discovered between 1611 and 1870, and corrects readings in the KJV which nineteenth-century scholarship deemed mistaken. The New Testament was published in 1881, the Old Testament in 1885, and the Apocrypha in 1895. + + + + + Revised Standard + A translation authorized by the National Council of Churches of Christ in the USA. The New Testament was published in 1946 followed by a complete Protestant canon in 1951. + + + + + Reina Valera + A Spanish translation based on the original texts. + + + + + Bibelen, samisk + Norwegian 'samisk' Bible translation + + + + + Today’s English + A translation of the New Testament sponsored by the American Bible Society and first published in 1966. It was incorporated into the “Good News Bible” GNB in 1976. + + + + + Today’s New International + An updating of the New International Version. The New Testament was published in 2002, and the entire Bible is scheduled for 2005. + + + + + Other + Other translations not otherwise noted. + + + + + + + Study Bible type + + + + + Cambridge Annotated + Contains the work of Howard Clark Kee including a summary of the development of the canon, introductions to the books, notes and cross references. Originally published in 1993, NRSV. 
+ + + + + Life Application + A project of Tyndale House Publishers and Zondervan intended to help readers apply the Bible to daily living. Living Bible, King James, New International, NASB + + + + + Macarthur + A King James version study Bible with notes by James Macarthur first published in 1997. + + + + + Oxford Annotated + A study Bible originally published in the 1960s and based on the RSV / NRSV. + + + + + Studiebibel, Det Nye testamentet + Norwegian study Bible, New Testament + + + + + New Oxford Annotated + Published in 1991 and based on the New Revised Standard version. + + + + + Norsk studiebibel + Norwegian study Bible + + + + + Ryrie + Based on the work of Charles C. Ryrie. King James, NI, NASB + + + + + Scofield + A study Bible based on the early 20th century work of C.I. Scofield. Based on the King James version. + + + + + Spirit Filled + A transdenominational study Bible for persons from the Pentecostal/Charismatic traditions. + + + + + + + Bible purpose + + + + + Award + A Bible designed for presentation from a religious organization. + + + + + Baby + A Bible designed to be a gift to commemorate a child’s birth. + + + + + Bride + A special gift Bible designed for the bride on her wedding day. Usually white. + + + + + Confirmation + A Bible designed to be used in the confirmation reading or as a gift to a confirmand + + + + + Children’s + A text Bible designed in presentation and readability for a child. + + + + + Compact + A small Bible with a trim height of five inches or less. + + + + + Cross-reference + A Bible which includes text conveying cross-references to related scripture passages. + + + + + Daily readings + A Bible laid out to provide readings for each day of the year. + + + + + Devotional + A Bible containing devotional content together with the scripture. + + + + + Family + A Bible containing family record pages and/or additional study material for family devotion + + + + + General/Text + A standard Bible of any version with no distinguishing characteristics beyond the canonical text. + + + + + Gift + A Bible designed for gift or presentation, often including a presentation page. + + + + + Lectern/Pulpit + A large Bible with large print designed for use in reading scriptures in public worship from either the pulpit or lectern. + + + + + Men’s + A Bible especially designed with helps and study guides oriented to the adult male. + + + + + Primary school + A Bible designed for use in primary school + + + + + Pew + Usually inexpensive but sturdy, a Bible designed for use in church pews. + + + + + Scholarly + A Bible including texts in Greek and/or Hebrew and designed for scholarly study. + + + + + Slimline + + + + + + Student + A Bible with study articles and helps especially for use in the classroom. + + + + + Study + A Bible with many extra features, e.g. book introductions, dictionary, concordance, references, maps, etc., to help readers better understand the scripture. + + + + + Wedding gift + A special gift Bible designed as a gift to the couple on their wedding day + + + + + Women’s + A devotional or study Bible with helps targeted at the adult woman. + + + + + Youth + A Bible containing special study and devotional helps designed specifically for the needs of teenagers. + + + + + + + Bible text organization + + + + + Chronological + A Bible with the text organized in the order in which events are believed to have happened. + + + + + Chain reference + A Bible which explores keywords or themes by referring text to preceding or following text. 
+ + + + + Interlinear + A Bible or other text in which different versions are printed one line above the other, so that the variations can easily be detected. + + + + + Parallel + A Bible with two or more versions printed side by side. + + + + + Standard + A Bible in which the text is presented in the traditional order. + + + + + + + Bible reference location + + + + + Center column + References are printed in a narrow column in the center of the page between two columns of text. + + + + + Page end + References are printed at the foot of the page. + + + + + Side column + References are printed in a column to the side of the scripture. + + + + + Verse end + References are printed at the end of the applicable verse. + + + + + Unknown + The person creating the ONIX record does not know where the references are located. + + + + + Other + Other locations not otherwise identified + + + + + + + Religious text identifier + + + + + + Religious text feature type + + + + + + Religious text feature code + + + + + + Country code - ISO 3166-1 + + + + + Andorra + + + + + + United Arab Emirates + + + + + + Afghanistan + + + + + + Antigua and Barbuda + + + + + + Anguilla + + + + + + Albania + + + + + + Armenia + + + + + + Netherlands Antilles + + + + + + Angola + + + + + + Antarctica + + + + + + Argentina + + + + + + American Samoa + + + + + + Austria + + + + + + Australia + + + + + + Aruba + + + + + + Aland Islands + + + + + + Azerbaijan + + + + + + Bosnia and Herzegovina + + + + + + Barbados + + + + + + Bangladesh + + + + + + Belgium + + + + + + Burkina Faso + + + + + + Bulgaria + + + + + + Bahrain + + + + + + Burundi + + + + + + Benin + + + + + + Bermuda + + + + + + Brunei Darussalam + + + + + + Bolivia + + + + + + Brazil + + + + + + Bahamas + + + + + + Bhutan + + + + + + Bouvet Island + + + + + + Botswana + + + + + + Belarus + + + + + + Belize + + + + + + Canada + + + + + + Cocos (Keeling) Islands + + + + + + Congo, Democratic Republic of the + + + + + + Central African Republic + + + + + + Congo + + + + + + Switzerland + + + + + + Cote D'Ivoire + + + + + + Cook Islands + + + + + + Chile + + + + + + Cameroon + + + + + + China + + + + + + Colombia + + + + + + Costa Rica + + + + + + Serbia and Montenegro + Replaces YU – Yugoslavia + + + + + Cuba + + + + + + Cape Verde + + + + + + Christmas Island + + + + + + Cyprus + + + + + + Czech Republic + + + + + + Germany + + + + + + Djibouti + + + + + + Denmark + + + + + + Dominica + + + + + + Dominican Republic + + + + + + Algeria + + + + + + Ecuador + + + + + + Estonia + + + + + + Egypt + + + + + + Western Sahara + + + + + + Eritrea + + + + + + Spain + + + + + + Ethiopia + + + + + + Finland + + + + + + Fiji + + + + + + Falkland Islands (Malvinas) + + + + + + Micronesia, Federated States of + + + + + + Faroe Islands + + + + + + France + + + + + + Gabon + + + + + + United Kingdom + + + + + + Grenada + + + + + + Georgia + + + + + + French Guiana + + + + + + Ghana + + + + + + Gibraltar + + + + + + Greenland + + + + + + Gambia + + + + + + Guinea + + + + + + Guadeloupe + + + + + + Equatorial Guinea + + + + + + Greece + + + + + + South Georgia and the South Sandwich Islands + + + + + + Guatemala + + + + + + Guam + + + + + + Guinea-Bissau + + + + + + Guyana + + + + + + Hong Kong + + + + + + Heard Island and McDonald Islands + + + + + + Honduras + + + + + + Croatia + + + + + + Haiti + + + + + + Hungary + + + + + + Indonesia + + + + + + Ireland + + + + + + Israel + + + + + + India + + + + + + British Indian Ocean Territory + + + + + + Iraq + + + + + + Iran, Islamic 
Republic of + + + + + + Iceland + + + + + + Italy + + + + + + Jamaica + + + + + + Jordan + + + + + + Japan + + + + + + Kenya + + + + + + Kyrgyzstan + + + + + + Cambodia + + + + + + Kiribati + + + + + + Comoros + + + + + + Saint Kitts and Nevis + + + + + + Korea, Democratic People's Republic of + + + + + + Korea, Republic of + + + + + + Kuwait + + + + + + Cayman Islands + + + + + + Kazakhstan + + + + + + Lao People's Democratic Republic + + + + + + Lebanon + + + + + + Saint Lucia + + + + + + Liechtenstein + + + + + + Sri Lanka + + + + + + Liberia + + + + + + Lesotho + + + + + + Lithuania + + + + + + Luxembourg + + + + + + Latvia + + + + + + Libyan Arab Jamahiriya + + + + + + Morocco + + + + + + Monaco + + + + + + Moldova, Republic of + + + + + + Madagascar + + + + + + Marshall Islands + + + + + + Macedonia, the former Yugoslav Republic of + + + + + + Mali + + + + + + Myanmar + + + + + + Mongolia + + + + + + Macao + + + + + + Northern Mariana Islands + + + + + + Martinique + + + + + + Mauritania + + + + + + Montserrat + + + + + + Malta + + + + + + Mauritius + + + + + + Maldives + + + + + + Malawi + + + + + + Mexico + + + + + + Malaysia + + + + + + Mozambique + + + + + + Namibia + + + + + + New Caledonia + + + + + + Niger + + + + + + Norfolk Island + + + + + + Nigeria + + + + + + Nicaragua + + + + + + Netherlands + + + + + + Norway + + + + + + Nepal + + + + + + Nauru + + + + + + Niue + + + + + + New Zealand + + + + + + Oman + + + + + + Panama + + + + + + Peru + + + + + + French Polynesia + + + + + + Papua New Guinea + + + + + + Philippines + + + + + + Pakistan + + + + + + Poland + + + + + + Saint Pierre and Miquelon + + + + + + Pitcairn + + + + + + Puerto Rico + + + + + + Palestinian Territory, Occupied + + + + + + Portugal + + + + + + Palau + + + + + + Paraguay + + + + + + Qatar + + + + + + Reunion + + + + + + Romania + + + + + + Russian Federation + + + + + + Rwanda + + + + + + Saudi Arabia + + + + + + Solomon Islands + + + + + + Seychelles + + + + + + Sudan + + + + + + Sweden + + + + + + Singapore + + + + + + Saint Helena + + + + + + Slovenia + + + + + + Svalbard and Jan Mayen + + + + + + Slovakia + + + + + + Sierra Leone + + + + + + San Marino + + + + + + Senegal + + + + + + Somalia + + + + + + Suriname + + + + + + Sao Tome and Principe + + + + + + El Salvador + + + + + + Syrian Arab Republic + + + + + + Swaziland + + + + + + Turks and Caicos Islands + + + + + + Chad + + + + + + French Southern Territories + + + + + + Togo + + + + + + Thailand + + + + + + Tajikistan + + + + + + Tokelau + + + + + + Timor-Leste + + + + + + Turkmenistan + + + + + + Tunisia + + + + + + Tonga + + + + + + Turkey + + + + + + Trinidad and Tobago + + + + + + Tuvalu + + + + + + Taiwan, Province of China + + + + + + Tanzania, United Republic of + + + + + + Ukraine + + + + + + Uganda + + + + + + United States Minor Outlying Islands + + + + + + United States + + + + + + Uruguay + + + + + + Uzbekistan + + + + + + Holy See (Vatican City State) + + + + + + Saint Vincent and the Grenadines + + + + + + Venezuela + + + + + + Virgin Islands, British + + + + + + Virgin Islands, US + + + + + + Viet Nam + + + + + + Vanuatu + + + + + + Wallis and Futuna + + + + + + Samoa + + + + + + Yemen + + + + + + Mayotte + + + + + + Yugoslavia + DEPRECATED, replaced by CS – Serbia and Montenegro + + + + + South Africa + + + + + + Zambia + + + + + + Zimbabwe + + + + + + + + Supplier identifier type + + + + + Proprietary + + + + + + Börsenverein Verkehrsnummer + + + + + + German ISBN Agency publisher identifier + + + + + + EAN-UCC GLN + Global 
location number (formerly EAN location number) + + + + + SAN + Book trade Standard Address Number - US, UK etc + + + + + + + Supplier role + + + + + Unspecified + Default + + + + + Publisher + + + + + + Publisher's exclusive distributor + In a specified supply territory + + + + + Publisher's non-exclusive distributor + In a specified supply territory + + + + + Wholesaler + + + + + + Sales agent + DEPRECATED - use <MarketRepresentation> to specify a sales agent + + + + + Publisher's distributor + In a specified supply territory. Use only where exclusive/non-exclusive status is not known. Prefer 02 or 03 as appropriate, where possible. + + + + + POD supplier + Where a POD product is supplied to retailers and/or consumers direct from a POD source. + + + + + + + Default linear unit + + + + + Centimeters + + + + + + Inches (US) + + + + + + Millimeters + + + + + + + + Default unit of weight + + + + + Pounds (US) + + + + + + Grams + + + + + + Ounces (US) + + + + + + + + Currency code - ISO 4217 + + + + + UAE Dirham + United Arab Emirates + + + + + Afghani + DEPRECATED, replaced by AFN + + + + + Afghani + Afghanistan + + + + + Lek + Albania + + + + + Armenian Dram + Armenia + + + + + Netherlands Antillian Guilder + Netherlands Antilles + + + + + Kwanza + Angola + + + + + Argentine Peso + Argentina + + + + + Austria, Schilling + Now replaced by the Euro (EUR): use only for historical prices that pre-date the introduction of the Euro + + + + + Australian Dollar + Australia, Christmas Island, Cocos (Keeling) Islands, Heard Island and McDonald Islands, Kiribati, Nauru, Norfolk Island, Tuvalu + + + + + Aruban Guilder + Aruba + + + + + Azerbaijanian Manat + Azerbaijan + + + + + Convertible Marks + Bosnia & Herzegovina + + + + + Barbados Dollar + Barbados + + + + + Taka + Bangladesh + + + + + Belgium, Franc + Now replaced by the Euro (EUR): use only for historical prices that pre-date the introduction of the Euro + + + + + Lev + DEPRECATED, replaced by BGN + + + + + Lev + Bulgaria + + + + + Bahraini Dinar + Bahrain + + + + + Burundi Franc + Burundi + + + + + Bermuda Dollar + Bermuda + + + + + Brunei Dollar + Brunei Darussalam + + + + + Boliviano + Bolivia + + + + + Brazilian Real + Brazil + + + + + Bahamian Dollar + Bahamas + + + + + Ngultrun + Bhutan + + + + + Pula + Botswana + + + + + Belarussian Ruble + Belarus + + + + + Belize Dollar + Belize + + + + + Canadian Dollar + Canada + + + + + Franc Congolais + Congo (Democratic Republic of the) + + + + + Swiss Franc + Switzerland, Liechtenstein + + + + + Chilean Peso + Chile + + + + + Yuan Renminbi + China + + + + + Colombian Peso + Colombia + + + + + Costa Rican Colon + Costa Rica + + + + + Serbian Dinar + Serbia + + + + + Cuban Convertible Peso + Cuba (alternative currency) + + + + + Cuban Peso + Cuba + + + + + Cape Verde Escudo + Cape Verde + + + + + Cyprus Pound + Cyprus + + + + + Czech Koruna + Czech Republic + + + + + Germany, Mark + Now replaced by the Euro (EUR): use only for historical prices that pre-date the introduction of the Euro + + + + + Djibouti Franc + Djibouti + + + + + Danish Krone + Denmark, Faroe Islands, Greenland + + + + + Dominican Peso + Dominican Republic + + + + + Algerian Dinar + Algeria + + + + + Kroon + Estonia + + + + + Egyptian Pound + Egypt + + + + + Nakfa + Eritrea + + + + + Spain, Peseta + Now replaced by the Euro (EUR): use only for historical prices that pre-date the introduction of the Euro + + + + + Ethiopian Birr + Ethiopia + + + + + Euro + Andorra, Austria, Belgium, Finland, France, Fr Guiana, Fr S Territories, 
Germany, Greece, Guadeloupe, Holy See (Vatican City), Ireland, Italy, Luxembourg, Martinique, Mayotte, Monaco, Netherlands, Portugal, Réunion, St Pierre & Miquelon, San Marino, Spain + + + + + Finland, Markka + Now replaced by the Euro (EUR): use only for historical prices that pre-date the introduction of the Euro + + + + + Fiji Dollar + Fiji + + + + + Falkland Islands Pound + Falkland Islands (Malvinas) + + + + + France, Franc + Now replaced by the Euro (EUR): use only for historical prices that pre-date the introduction of the Euro + + + + + Pound Sterling + United Kingdom + + + + + Lari + Georgia + + + + + Cedi + Ghana + + + + + Gibraltar Pound + Gibraltar + + + + + Dalasi + Gambia + + + + + Guinea Franc + Guinea + + + + + Greece, Drachma + Now replaced by the Euro (EUR): use only for historical prices that pre-date the introduction of the Euro + + + + + Quetzal + Guatemala + + + + + Guinea-Bissau Peso + Guinea-Bissau + + + + + Guyana Dollar + Guyana + + + + + Hong Kong Dollar + Hong Kong + + + + + Lempira + Honduras + + + + + Croatian Kuna + Croatia + + + + + Gourde + Haiti + + + + + Forint + Hungary + + + + + Rupiah + Indonesia + + + + + Ireland, Punt + Now replaced by the Euro (EUR): use only for historical prices that pre-date the introduction of the Euro + + + + + Israeli Sheqel + Israel + + + + + Indian Rupee + India + + + + + Iraqi Dinar + Iraq + + + + + Iranian Rial + Iran (Islamic Republic of) + + + + + Iceland Krona + Iceland + + + + + Italy, Lira + Now replaced by the Euro (EUR): use only for historical prices that pre-date the introduction of the Euro + + + + + Jamaican Dollar + Jamaica + + + + + Jordanian Dinar + Jordan + + + + + Yen + Japan + + + + + Kenyan Shilling + Kenya + + + + + Som + Kyrgyzstan + + + + + Riel + Cambodia + + + + + Comoro Franc + Comoros + + + + + North Korean Won + Korea (Democratic People’s Republic of) + + + + + Won + Korea (Republic of) + + + + + Kuwaiti Dinar + Kuwait + + + + + Cayman Islands Dollar + Cayman Islands + + + + + Tenge + Kazakstan + + + + + Kip + Lao People’s Democratic Republic + + + + + Lebanese Pound + Lebanon + + + + + Sri Lanka Rupee + Sri Lanka + + + + + Liberian Dollar + Liberia + + + + + Loti + Lesotho + + + + + Lithuanian Litus + Lithuania + + + + + Luxembourg, Franc + Now replaced by the Euro (EUR): use only for historical prices that pre-date the introduction of the Euro + + + + + Latvian Lats + Latvia + + + + + Libyan Dinar + Libyan Arab Jamahiriya + + + + + Moroccan Dirham + Morocco, Western Sahara + + + + + Moldovan Leu + Moldova, Republic of + + + + + Ariary + Madagascar + + + + + Malagasy Franc + Madagascar + + + + + Denar + Macedonia (former Yugoslav Republic of) + + + + + Kyat + Myanmar + + + + + Tugrik + Mongolia + + + + + Pataca + Macau + + + + + Ouguiya + Mauritania + + + + + Maltese Lira + Malta + + + + + Mauritius Rupee + Mauritius + + + + + Rufiyaa + Maldives + + + + + Kwacha + Malawi + + + + + Mexican Peso + Mexico + + + + + Malaysian Ringgit + Malaysia + + + + + Metical + Mozambique + + + + + Namibia Dollar + Namibia + + + + + Naira + Nigeria + + + + + Cordoba Oro + Nicaragua + + + + + Netherlands, Guilder + Now replaced by the Euro (EUR): use only for historical prices that pre-date the introduction of the Euro + + + + + Norwegian Krone + Norway, Bouvet Island, Svalbard and Jan Mayen + + + + + Nepalese Rupee + Nepal + + + + + New Zealand Dollar + New Zealand, Cook Islands, Niue, Pitcairn, Tokelau + + + + + Rial Omani + Oman + + + + + Balboa + Panama + + + + + Nuevo Sol + Peru + + + + + Kina + Papua New 
Guinea + + + + + Philippine Peso + Philippines + + + + + Pakistan Rupee + Pakistan + + + + + Zloty + Poland + + + + + Portugal, Escudo + Now replaced by the Euro (EUR): use only for historical prices that pre-date the introduction of the Euro + + + + + Guarani + Paraguay + + + + + Qatari Rial + Qatar + + + + + Leu + Romania + + + + + Russian Ruble + Russian Federation + + + + + Russian Ruble + DEPRECATED, replaced by RUB + + + + + Rwanda Franc + Rwanda + + + + + Saudi Riyal + Saudi Arabia + + + + + Solomon Islands Dollar + Solomon Islands + + + + + Seychelles Rupee + Seychelles + + + + + Sudanese Dinar + Sudan + + + + + Swedish Krona + Sweden + + + + + Singapore Dollar + Singapore + + + + + Saint Helena Pound + Saint Helena + + + + + Tolar + Slovenia + + + + + Slovak Koruna + Slovakia + + + + + Leone + Sierra Leone + + + + + Somali Shilling + Somalia + + + + + Suriname Guilder + Suriname + + + + + Suriname Guilder + DEPRECATED, replaced by SRD + + + + + Dobra + São Tome and Principe + + + + + El Salvador Colon + El Salvador + + + + + Syrian Pound + Syrian Arab Republic + + + + + Lilangeni + Swaziland + + + + + Baht + Thailand + + + + + Somoni + Tajikistan + + + + + Manat + Turkmenistan + + + + + Tunisian Dinar + Tunisia + + + + + Pa’anga + Tonga + + + + + Timor Escudo + East Timor + + + + + Turkish Lira (old) + Turkey + + + + + Turkish Lira (new) + Turkey, from 1 January 2005 + + + + + Trinidad and Tobago Dollar + Trinidad and Tobago + + + + + New Taiwan Dollar + Taiwan (Province of China) + + + + + Tanzanian Shilling + Tanzania (United Republic of) + + + + + Hryvnia + Ukraine + + + + + Uganda Shilling + Uganda + + + + + US Dollar + United States, American Samoa, British Indian Ocean Territory, Ecuador, Guam, Marshall Is, Micronesia (Federated States of), Northern Mariana Is, Palau, Puerto Rico, Turks & Caicos Is, US Minor Outlying Is, Virgin Is (British), Virgin Is (US) + + + + + Peso Uruguayo + Uruguay + + + + + Uzbekistan Sum + Uzbekistan + + + + + Bolivar + Venezuela + + + + + Dong + Viet Nam + + + + + Vatu + Vanuatu + + + + + Tala + Samoa + + + + + CFA Franc BEAC + Cameroon, Central African Republic, Chad, Congo, Equatorial Guinea, Gabon + + + + + East Caribbean Dollar + Anguilla, Antigua and Barbuda, Dominica, Grenada, Montserrat, Saint Kitts and Nevis, Saint Lucia, Saint Vincent and the Grenadines + + + + + CFA Franc BCEAO + Benin, Burkina Faso, Côte D'Ivoire, Mali, Niger, Senegal, Togo + + + + + CFP Franc + French Polynesia, New Caledonia, Wallis and Futuna + + + + + Yemeni Rial + Yemen + + + + + Yugoslavian Dinar + DEPRECATED, replaced by CSD + + + + + Rand + South Africa + + + + + Kwacha + Zambia + + + + + Zimbabwe Dollar + Zimbabwe + + + + + + + Bible text feature + + + + + Red letter + Words spoken by Christ are printed in red + + + + + + + Product form feature value - binding or page edge color + + + + + Black + + + + + + Blue + + + + + + Brown + + + + + + Burgundy/maroon + + + + + + Cream + + + + + + Gold + + + + + + Green + + + + + + Grey + + + + + + Multicolor + + + + + + Navy + + + + + + Orange + + + + + + Pink + + + + + + Purple + + + + + + Red + + + + + + Silver + + + + + + Tan + + + + + + White + + + + + + Yellow + + + + + + Other + + + + + + + + Product form feature value - special cover material + + + + + Berkshire leather + Pigskin + + + + + Calfskin + + + + + + French Morocco + Calf split or sheep split + + + + + Morocco + Goatskin + + + + + Bonded buffalo grain + + + + + + Bonded calf grain + + + + + + Bonded Cordova + + + + + + Bonded eelskin + + + + + + Bonded 
Ostraleg + + + + + + Bonded ostrich + + + + + + Bonded reptile grain + + + + + + Bonded leather + + + + + + Cowhide + + + + + + Eelskin + + + + + + Kivar + + + + + + Leatherflex + + + + + + Moleskin + + + + + + Softhide leather + + + + + + Metal + + + + + + Velvet + German 'Samt' + + + + + Mother-of-pearl + Spanish 'nácar' + + + + + Papyrus + + + + + + Géltex + An imitation cloth binding material + + + + + Guaflex + An imitation leather binding material + + + + + + + Discount code type + + + + + BIC discount group code + UK publisher's or distributor's discount group code in a format specified by BIC to ensure uniqueness + + + + + Proprietary + + + + + + Boeksoort + Terms code used in the Netherlands book trade + + + + + German terms code + Terms code used in German ONIX applications + + + + + + + Person name identifier type + + + + + Proprietary + + + + + + DNB-PND + Deutsche Bibliothek Personennormdatei - person name code of the German national library + + + + + + + Sales outlet identifier type + + + + + Proprietary + + + + + + BIC sales outlet identifier code + + + + + + + + + + + + + + + + + + diff --git a/ia-legacy-importer/onix/ONIX_BookProduct_Release2.1_reference.xsd new file mode 100644 index 00000000..2b93df7e --- /dev/null +++ b/ia-legacy-importer/onix/ONIX_BookProduct_Release2.1_reference.xsd @@ -0,0 +1,6396 @@
+ + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + + diff --git a/ia-legacy-importer/onix/README b/ia-legacy-importer/onix/README new file mode 100644 index 00000000..92ea16cc --- /dev/null +++ b/ia-legacy-importer/onix/README @@ 
-0,0 +1,4 @@ + +to test basic onix handling, you can run test-onix.sh +with an onix file on standard input. + diff --git a/ia-legacy-importer/onix/__init__.py b/ia-legacy-importer/onix/__init__.py new file mode 100644 index 00000000..bccec2ef --- /dev/null +++ b/ia-legacy-importer/onix/__init__.py @@ -0,0 +1 @@ +"""onix""" diff --git a/ia-legacy-importer/onix/config.sh b/ia-legacy-importer/onix/config.sh new file mode 100644 index 00000000..cb97d4d0 --- /dev/null +++ b/ia-legacy-importer/onix/config.sh @@ -0,0 +1,7 @@ +#!/bin/sh -e + +export URL_CACHE_DIR=urlcache # a temporary directory +export PHAROS_REPO="../.." # the root of the Open Library repository +export PYTHONPATH="$PHAROS_REPO" +export PYTHON_INTERPRETER=python2.5 + diff --git a/ia-legacy-importer/onix/import-log.sh b/ia-legacy-importer/onix/import-log.sh new file mode 100755 index 00000000..8ec7c7af --- /dev/null +++ b/ia-legacy-importer/onix/import-log.sh @@ -0,0 +1,3 @@ +#!/bin/sh + +exec env PHAROS_DBNAME=dbglog PHAROS_DBUSER=pharos PHAROS_DBPASS=pharos PHAROS_SITE=site0 PHAROS_LOGFILE=/1/dbg/import-logs/dbglog URL_CACHE_DIR=urlcache python2.4 onix-import.py diff --git a/ia-legacy-importer/onix/import.sh b/ia-legacy-importer/onix/import.sh new file mode 100755 index 00000000..a1656065 --- /dev/null +++ b/ia-legacy-importer/onix/import.sh @@ -0,0 +1,13 @@ +#!/bin/sh + +export PHAROS_DBNAME=dbgtest +export PHAROS_DBUSER=dbg +export PHAROS_SITE=site1 + +export PHAROS_EDITION_PREFIX="b/" +export PHAROS_AUTHOR_PREFIX="a/" + +export URL_CACHE_DIR=urlcache +export PYTHONPATH=/home/dbg/lib/python + +exec python2.4 onix-import.py diff --git a/ia-legacy-importer/onix/onix-import.py b/ia-legacy-importer/onix/onix-import.py new file mode 100644 index 00000000..5961ea10 --- /dev/null +++ b/ia-legacy-importer/onix/onix-import.py @@ -0,0 +1,229 @@ +import web +import infogami.tdb as tdb +from infogami.tdb import NotFound, Things, LazyThing +from items import * +from onix import parser +import sys +import unicodedata +import re +import os +from lang import * +from types import * + +source_name = None +source_path = None +edition_prefix = None +author_prefix = None + +edition_records = set ([]) +item_names = {} +#edition_names = set ([]) +#author_names = {} + +def setup (): + def getvar (name, required=True): + val = os.getenv (name) + if required and val is None: + raise Exception ("found no environment variable %s" % name) + return val + dbname = getvar ("PHAROS_DBNAME") + dbuser = getvar ("PHAROS_DBUSER") + dbpass = getvar ("PHAROS_DBPASS") + web.config.db_parameters = dict(dbn='postgres', db=dbname, user=dbuser, pw=dbpass) + web.db._hasPooling = False + web.config.db_printing = False + web.load() + tdb.setup() + logfile = getvar ("PHAROS_LOGFILE", False) + if logfile: + tdb.logger.set_logfile (open (logfile, "a")) + sys.stderr.write ("logging to %s\n" % logfile) + + global source_name, source_path + source_dir = getvar ("PHAROS_SOURCE_DIR") + source_name = sys.argv[1] + source_path = "%s/%s" % (source_dir, source_name) + + global edition_prefix, author_prefix + edition_prefix = getvar ("PHAROS_EDITION_PREFIX", False) or "" + author_prefix = getvar ("PHAROS_AUTHOR_PREFIX", False) or "" + + setup_names () + +def setup_names (): + global item_names, edition_records, source_name + + warn ("walking the length and breadth of the database ...") + author_type = Author.type () + edition_type = Edition.type () + walked = 0 + parent_id = site_object().id + for r in web.query ("SELECT id,name FROM thing WHERE parent_id = $parent_id", 
vars=locals()): + item_names[r.name] = r.id + + for r in web.query ("SELECT d1.value FROM datum AS d1, datum AS d2 WHERE d1.version_id=d2.version_id AND d1.key='source_record_lineno' AND d2.key='source_name' AND d2.value=$source_name", { 'source_name': source_name }): + edition_records.add (int (r.value)) + + warn ("noted %d items" % len (item_names)) + if len (edition_records) > 0: + warn ("already have %d records from this source; they will be ignored" % len (edition_records)) + +def import_file (input): + n = 0 + for x in parser (input): + n += 1 + import_item (x) + if n % 100 == 0: + sys.stderr.write ("." * 30 + " read %d records\n" % n) + sys.stderr.write ("\nread %d records\n" % n) + +skipped = 0 +imported = 0 + +def import_author (x): + name = author_prefix + name_string (x["name"]) + a = None + + global item_names + aid = item_names.get (name, None) + if aid: + a = LazyThing (aid) + # warn ("---------------------------> already author %s" % name) + else: + a = Author (name, d=massage_dict (x)) + a.save () + item_names[name] = a.id + # warn ("AUTHOR %s" % name) + return a + +def import_item (x): + global skipped, imported + + global edition_records + lineno = x["source_record_lineno"] + if lineno in edition_records: + skipped += 1 + if skipped % 100 == 0: + warn ("skipped %d" % skipped) + return + + # import the authors + authors = map (import_author, x.get ("authors") or []) + if x.get ("authors"): + del x["authors"] + + # find a unique name for the edition + global item_names + name = None + for n in edition_name_choices (x): + nn = edition_prefix + n + if nn not in item_names: + name = nn + break + + if not name: + raise Exception ("couldn't find a unique name for %s" % x) + + e = Edition (name, d=massage_dict (x)) + global source_name + e.source_name = source_name + e.authors = authors + e.save () + item_names[name] = e.id + edition_records.add (e.source_record_lineno) + imported += 1 + if imported % 100 == 0: + warn ("imported %d" % imported) + + # sys.stderr.write ("EDITION %s\n" % name) + +ignore_title_words = ['a', 'the'] +tsep = '_' + +def edition_name_choices (x): + # use up to 25 chars of title, including last word + title = name_safe (x['title']) + title_words = [ w for w in title.split() if w.lower() not in ignore_title_words ] + if len (title_words) == 0: + raise Exception ("no usable title chars") + ttail = title_words.pop (-1) + tlen = len (ttail) + name = "" + nlen = 1 + tlen + if title_words: + name = title_words.pop (0) + nlen = len (name) + 1 + tlen + while title_words: + w = title_words.pop (0) + wlen = len (w) + if nlen + 1 + wlen < 25: + name += "_" + w + nlen += 1 + wlen + if name: + name += "_" + name += ttail + name = name[0:30] + yield name + + ed_number = x.get ('edition_number') + if ed_number: + name = tsep.join ([name, name_string (ed_number)]) + yield name + + ed_type = x.get ('edition_type') + if ed_type: + name = tsep.join ([name, name_string (ed_type)]) + yield name + + ed = x.get ('edition') + if ed: + name = tsep.join ([name, name_string (ed)]) + yield name + + format = x.get ('physical_format') + if format: + name = tsep.join ([name, name_string (format)]) + yield name + + nlen = len (name) + n = 0 + while True: + name = name[:nlen] + tsep + "%d" % n + yield name + n += 1 + + return + +re_name_safe = re.compile (r'[^a-zA-Z0-9]') +def name_safe (s): + s = asciify (s) + s = s.replace ("'", "") + return re.sub (re_name_safe, ' ', s) + +def name_string (s): + s = name_safe (s) + words = s.split () + return '_'.join (words) + +def asciify (s): + 
return unicodedata.normalize('NFKD', s).encode('ASCII', 'ignore') + +def massage_value (v): + if (isinstance (v, UnicodeType)): + return v.encode ('utf8') + elif (isinstance (v, ListType)): + return map (massage_value, v) + else: + return v + +def massage_dict (d): + dd = {} + for (k, v) in d.iteritems (): + dd[k] = massage_value (v) + return dd + +if __name__ == "__main__": + setup() + sys.stderr.write ("--> setup finished\n") + import_file (open (source_path, "r")) + sys.stderr.write ("--> import finished\n") diff --git a/ia-legacy-importer/onix/onix.py b/ia-legacy-importer/onix/onix.py new file mode 100644 index 00000000..c0a2c2aa --- /dev/null +++ b/ia-legacy-importer/onix/onix.py @@ -0,0 +1,190 @@ +from __future__ import print_function +# wrapper code for easier handling of ONIX files: +# +# OnixHandler -- a sax ContentHandler that produces a stream of ONIX "product" data in xmltramp objects +# +# OnixProduct -- a wrapper for the objects produced by OnixHandler, providing human-friendly field access +# (mostly just providing a dictionary interface where long ("reference") names can be used even when the +# data is encoded with opaque ("short") names.) + +from xml.sax.handler import * +from catalog.onix.sax_utils import * +from catalog.onix import xmltramp + +repo_path = os.getenv ("PHAROS_REPO") +codelists_path = "%s/%s" % (repo_path, "catalog/onix/ONIX_BookProduct_CodeLists.xsd") +ref_dtd_path = "%s/%s" % (repo_path, "catalog/onix/ONIX_BookProduct_Release2.1_reference.xsd") + +# for testing, also set URL_CACHE_DIR; see bottom. + +onix_codelists = None +onix_shortnames = None + +def init (): + f = open (codelists_path, "r") + onix_codelists = parse_codelists (f) + f.close () + f = open (ref_dtd_path, "r") + onix_shortnames = parse_shortnames (f) + f.close () + +class OnixProduct: + # N.B.: this only works when using the "short" names of elements. + # we should check that the document uses the short DTD, and if not, + # use the reference names to access field values. 
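+    #
+    # hedged usage sketch (mirrors how parse.py drives this class; the values are illustrative):
+    #
+    #     op = OnixProduct (p)        # p is a product element produced by OnixHandler
+    #     titles = op["Title":]       # slice syntax: every <Title> composite, as a list
+    #     t = titles[0]
+    #     t["TitleType"]              # plain indexing: exactly one value, else KeyError/Exception
+    #
+    # reference names such as "Title" are mapped to the short tags via get_shortname().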
+ + def __init__ (self, p): + self.p = p + + @staticmethod + def reify_child (v): + if len (v._dir) == 1 and isinstance (v._dir[0], StringTypes): + return v._dir[0] + else: + return OnixProduct (v) + + def __getitem__ (self, n): + slicing = False + if isinstance (n, SliceType): + slicing = True + reference_name = n.start + else: + reference_name = n + name = OnixProduct.get_shortname (reference_name) # or reference_name.lower () + values = self.p[name:] + if slicing: + return map (OnixProduct.reify_child, values) + else: + if len (values) == 0: + raise KeyError ("no value for %s (%s)" % (reference_name, name)) + elif len (values) > 1: + raise Exception ("more than one value for %s (%s)" % (reference_name, name)) + return OnixProduct.reify_child (values[0]) + + def get (self, n): + try: + return self.__getitem__ (n) + except KeyError: + return None + + def getLineNumber (self): + return self.p.getLineNumber () + + def __unicode__ (self): + return self.p.__unicode__ () + + def __str__ (self): + return self.__unicode__ () + + def pi_type_name (code): + return onix_codelists["List5"][code][0] + + @staticmethod + def contributor_role (code): + return onix_codelists["List17"][code][0] + + @staticmethod + def get_shortname (reference_name): + try: + return onix_shortnames[reference_name] + except KeyError: + raise Exception ("unknown reference name: %s" % reference_name) + +class OnixHandler (ContentHandler): + + def __init__ (self, parser, receiver): + self.parser = parser + self.receiver = receiver + self.subhandler = None + ContentHandler.__init__ (self) + + def startElementNS (self, name, qname, attrs): + if self.subhandler: + self.subhandler.startElementNS (name, qname, attrs) + self.subdepth += 1 + else: + (uri, localname) = name + if localname == "product": + self.subhandler = xmltramp.Seeder (self.parser) + self.subhandler.startElementNS (name, qname, attrs) + self.subdepth = 1 + + def endElementNS (self, name, qname): + if self.subhandler: + self.subhandler.endElementNS (name, qname) + self.subdepth -= 1 + if self.subdepth == 0: + self.receiver (self.subhandler.result) + self.subhandler = None + + def characters (self, content): + if self.subhandler: + self.subhandler.characters (content) + +def parse_shortnames (input): + def schema (name, attrs): + def element (name, attrs): + def typespec (name, attrs): + def attribute (name, attrs): + if (attrs.getValueByQName ('name') == "shortname"): + shortname = attrs.getValueByQName ('fixed') + return CollectorValue (shortname) + else: + return CollectorNone () + return NodeCollector ({ 'attribute': attribute, collector_any: typespec }) + elt_name = attrs.getValueByQName ('name') + return NamedCollector (elt_name, { collector_any: typespec }) + return DictCollector ({ 'element': element }) + return collector_parse (input, { 'schema': schema }) + +def parse_codelists (input): + def schema (name, attrs): + def simpleType (name, attrs): + def restriction (name, attrs): + def enumeration (name, attrs): + def annotation (name, attrs): + def documentation (name, attrs): + return TextCollector () + return ListCollector ({ 'documentation': documentation }) + return NamedCollector (attrs.getValueByQName (u'value'), { 'annotation': annotation }) + return DictCollector ({ 'enumeration': enumeration }) + return NamedCollector (attrs.getValueByQName (u'name'), { 'restriction': restriction }) + return DictCollector ({ 'simpleType': simpleType }) + return collector_parse (input, { 'schema': schema }) + +init () + +### testing + +from xml.sax.saxutils import 
prepare_input_source + +class TestErrorHandler: + def error (self, exn): + raise exn + def fatalError (self, exn): + raise exn + def warning (self, exn): + sys.stderr.write ("warning: %s\n" % exn.getMessage) + +def produce_items (input, produce): + source = prepare_input_source (input) + + parser = xml.sax.make_parser () + parser.setFeature (xml.sax.handler.feature_namespaces, 1) + parser.setContentHandler (OnixHandler (parser, process_item)) + url_cache_dir = os.getenv ("URL_CACHE_DIR") + if url_cache_dir: + sys.stderr.write ("using url cache in %s\n" % url_cache_dir) + parser.setEntityResolver (CachingEntityResolver (parser, url_cache_dir)) + else: + sys.stderr.write ("no url_cache_dir; XML resources will always be loaded from network\n") + parser.setErrorHandler (TestErrorHandler ()) + parser.parse (source) + +def process_item (i): + print(OnixProduct (i)) + +if __name__ == "__main__": + from sys import stdin + print("Reading ONIX data from standard input ...") + produce_items (stdin, process_item) diff --git a/ia-legacy-importer/onix/parse.py b/ia-legacy-importer/onix/parse.py new file mode 100644 index 00000000..ccf771db --- /dev/null +++ b/ia-legacy-importer/onix/parse.py @@ -0,0 +1,276 @@ +# provides a parser from ONIX files to Open Library items + +import re +import sys +import os +from types import * +from lang import * + +import xml.sax +from xml.sax.handler import * +from xml.sax.saxutils import prepare_input_source + +from thread_utils import AsyncChannel, threaded_generator +from onix import OnixProduct, OnixHandler, onix_codelists + +import six + +def parser (input): + # returns a generator that produces dicts representing Open Library items + + def produce_items (produce): + source = prepare_input_source (input) + + parser = xml.sax.make_parser () + parser.setFeature (xml.sax.handler.feature_namespaces, 1) + parser.setContentHandler (OnixHandler (parser, process_product)) + url_cache_dir = os.getenv ("URL_CACHE_DIR") + if url_cache_dir: + sys.stderr.write ("using url cache in %s\n" % url_cache_dir) + parser.setEntityResolver (CachingEntityResolver (parser, url_cache_dir)) + else: + sys.stderr.write ("no url_cache_dir; XML resources will always be loaded from network\n") + parser.setErrorHandler (MyErrorHandler ()) + parser.parse (source) + + return threaded_generator (produce_items, 50) + +def process_product (p): + op = OnixProduct (p) # the incoming record + o = {} # the Open Library item we're producing + + # record id + o['source_record_lineno'] = p.getLineNumber () + + # title, subtitle + tt = [ t for t in op["Title":] if t["TitleType"] == '01' ] + if len (tt) > 1: + raise Exception ("more than one distinctive title") + elif len(tt) == 0: + raise Exception ("no distinctive title") + t = tt[0] + prefix = t.get ("TitlePrefix") + if prefix: + prefix = prefix.strip () + o['title_prefix_len'] = len (prefix) + 1 # prefix plus space + o['title'] = prefix + " " + t["TitleWithoutPrefix"].strip () + else: + title = t.get ("TitleText") + if title: + o['title'] = title + subtitle = t.get ("Subtitle") + if subtitle: + o['subtitle'] = subtitle + + # id codes (ISBN, etc.) 
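+    # (ProductIDType values come from ONIX code list 5; type '01' appears to be the
+    #  proprietary/internal identifier, which is why it is skipped below -- only named
+    #  types such as ISBN are copied onto the item under their list-5 name.)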
+ for pi in op["ProductIdentifier":]: + pi_type = pi["ProductIDType"] + pi_val = pi["IDValue"] + if pi_type != '01': + type_name = str (OnixProduct.pi_type_name (pi_type)).replace ("-", "_") + o[type_name] = pi_val + + # author, contributors + for c in op["Contributor":]: + role_codes = sorted(c["ContributorRole":]) + role_code = role_codes[0] + + name = person_name (c) + if not name: + warn ("=====> no name for contributor at line %d" % c.getLineNumber ()) + continue + + if role_code != 'A01': + role = OnixProduct.contributor_role (role_code) + add_val (o, "contributions", role + ": " + name) + continue + + author = {} + author["name"] = name + add_val (o, "authors", author) + + # iname = c.get ("PersonNameInverted") + # if iname: + # author["inverted_name"] = iname + # # XXX else construct inverted name from name parts + + pnis = c["PersonNameIdentifier":] + if len (pnis) > 0: + warn ("got PersonNameIdentifier(s): %s" % pnis[0]["IDValue"]) + + # other_names = c["Name":] + # XX: for pseudonyms, etc. ... should stash this somewhere + + for pdate in c["PersonDate":]: + role = pdate["PersonDateRole"] + # fmt = None + # fmt_code = pdate.get ("DateFormat") + # if fmt_code: + # fmt = onix_codelists["List55"][fmt_code] + date = pdate["Date"] + if role == "007": author["birth_date"] = date + elif role == "008": author["death_date"] = date + else: die ("bad date role: %s" % role) + + bio = c.get ("BiographicalNote") + if bio: + author["bio"] = bio + + # website + # country + # region + + contrib = op.get ("ContributorStatement") + if not o.get ("authors"): + # XXX: shouldn't do this: the ContributorStatement could have anything in it + # ... but this is the only way to get author names for one of the catalogs + if contrib: + author = {} + author["name"] = re_by.sub ('', contrib) + add_val (o, "authors", author) + + # edition + ed_type = op.get ("EditionTypeCode") + if ed_type: + o["edition_type"] = self.codelists["List21"][ed_type][0] + ed_number = op.get ("EditionNumber") + if ed_number: + ed_vers_num = op.get ("EditionVersionNumber") + if ed_vers_num: + ed_number += "-" + ed_vers_num + o["edition_number"] = ed_number + edition = op.get ("EditionStatement") + if edition: + o["edition"] = edition + + # format + format = op.get ("ProductFormDescription") + if format: + o["physical_format"] = format + npages = op.get ("NumberOfPages") + if npages: + o["number_of_pages"] = npages + nillus = op.get ("NumberOfIllustrations") + if nillus: + o["number_of_illustrations"] = nillus + ill_note = op.get ("IllustrationsNote") + if ill_note: + add_val (o, "notes", ill_note) + # see also composite + + # dimensions + + # language + # (see also composite) + lang_code = op.get ("LanguageOfText") + if lang_code: + o["language_code"] = lang_code + o["language"] = self.codelists["List74"][lang_code][0] + + # subject + bisac = op.get ("BISACMainSubject") + if bisac: + add_val (o, "BISAC_subject_categories", bisac) + for subject in op["Subject":]: + scheme = subject.get ("SubjectSchemeIdentifier") + if scheme and scheme == "10": + code = subject.get ("SubjectCode") + if code: + add_val (o, "BISAC_subject_categories", code) + + # description + for text in op["OtherText":]: + # type = text["TextTypeCode"] + format = text["TextFormat"] + if format not in ("00", "02", "07"): # ASCII, HTML, Basic ASCII + raise Exception ("unsupported description format: %s" % self.codelists["List34"][format][0]) + if o.get ("description"): + o["description"] += "\n" + text["Text"] + else: + o["description"] = text["Text"] + if not o.get 
("description"): + descr = op.get ("MainDescription") + if descr: + o["description"] = descr + + self.receiver (o) + + # publisher + for pub in op["Publisher":]: + role = pub.get ("PublishingRole") + if role is None or role == "01": + name = pub.get ("PublisherName") + if name: + o["publisher"] = name + break + if not o.get ("publisher"): + pub = op.get ("PublisherName") + if pub: + o["publisher"] = pub + + # imprint + imprint = op.get ("Imprint") + if imprint: + name = imprint.get ("ImprintName") + if name: + o["imprint"] = name + if not o.get ("imprint"): + imprint = op.get ("ImprintName") + if imprint: + o["imprint"] = imprint + + # publish_status + pstat = op.get ("PublishingStatus") + if pstat and pstat != "??": + status = self.codelists["List64"][pstat][0] + pstatnote = op.get ("PublishingStatusNote") + if pstatnote: + stats += ": " + pstatnote + o["publish_status"] = status + + # publish_date + pdate = op.get ("PublicationDate") + if pdate: + o["publish_date"] = pdate # YYYY[MM[DD]] + # XXX: need to convert + +class MyErrorHandler: + def error (self, exn): + raise exn + def fatalError (self, exn): + raise exn + def warning (self, exn): + sys.stderr.write ("warning: %s\n" % exn.getMessage) + +name_parts = ["TitlesBeforeNames", "NamesBeforeKey", "PrefixToKey", "KeyNames", "NamesAfterKey", "SuffixToKey"] +def person_name (x): + global name_parts + name = x.get ("PersonName") + if not name: + parts = [ p for p in map (lambda p: x.get (p), name_parts) if p ] + name = " ".join (parts) + if not name: + iname = x.get ("PersonNameInverted") + if iname: + # XXX this often works, but is not reliable; + # shouldn't really mess with unstructured names + m = re_iname.match (iname) + if m: + name = m.group (2) + " " + m.group (1) + else: + name = iname + if not name: + name = x.get ("CorporateName") + return name + +def elt_get (e, tag, reference_name): + ee = e.get (tag) or e.get (reference_name.lower ()) + return six.text_type(ee) if ee else None + + +re_by = re.compile ("^\s*by\s+", re.IGNORECASE) +re_iname = re.compile ("^(.*),\s*(.*)$") + +def add_val (o, key, val): + if val is not None: + o.setdefault (key, []).append (val) diff --git a/ia-legacy-importer/onix/sax_utils.py b/ia-legacy-importer/onix/sax_utils.py new file mode 100644 index 00000000..9aa01aa1 --- /dev/null +++ b/ia-legacy-importer/onix/sax_utils.py @@ -0,0 +1,177 @@ +import os +from types import * +from urlcache import URLCache +import xml.sax +from xml.sax.handler import * +import sys + +from six.moves import urllib + + +class CachingEntityResolver (EntityResolver): + def __init__ (self, parser, dir): + self.parser = parser + if not os.path.isdir (dir): + raise Exception ("CachingEntityResolver: no such directory: %s" % dir) + self.cache = URLCache (dir) + + def resolveEntity (self, pubid, sysid): + parser_sysid = self.parser.getSystemId () + src = None + if sysid.startswith ("http:"): + src = self.resolveURL (sysid) + elif isinstance (parser_sysid, StringTypes) and parser_sysid.startswith ("http:"): + src = self.resolveURL (sysid, parser_sysid) + if not src: + src = EntityResolver.resolveEntity (self, p, s) + return src + + def resolveURL (self, sysid, base = ""): + url = urllib.parse.urljoin (base, sysid) + source = xml.sax.xmlreader.InputSource (url) + f = self.cache.get (url) + source.setByteStream (f) + return source + +def collector_parse (input, dispatch): + parser = xml.sax.make_parser () + parser.setFeature (xml.sax.handler.feature_namespaces, 1) + handler = CollectorHandler (parser, dispatch) + # 
parser.setContentHandler (handler) # CollectorHandler sets ContentHandler + parser.parse (input) + return handler.get_value () + +class CollectorHandler: + def __init__ (self, parser, base): + self.parser = parser + base_collector = None + if isinstance (base, Collector): + base_collector = base + else: + base_collector = NodeCollector (base) + self.collectors = [base_collector] + base_collector.start (None, self) + self.set_handler () + + def get_value (self): + if len (self.collectors) == 1: + return self.collectors[0].finish () + else: + raise Exception ("CollectorHandler.get_value(): collection not finished") + + def top_collector (self): + if not len (self.collectors): + return None + else: + return self.collectors[-1] + + def push_collector (self, collector): + self.collectors.append (collector) + self.set_handler () + + def pop_collector (self): + self.collectors.pop () + self.set_handler () + + def set_handler (self): + self.parser.setContentHandler (self.top_collector ()) + +class Collector (ContentHandler): + def start (self, parent, handler): + self.parent = parent + self.handler = handler + def end (self): + self.handler.pop_collector () + self.handler = None + value = self.finish () + if not isinstance (value, CollectorNoneValue): + self.parent.collect (value) + self.parent = None + def finish (self): + pass + def endElementNS (self, name, qname): + self.end () + +class TextCollector (Collector): + def __init__ (self): + self.value = None + def characters (self, content): + self.value = content + def finish (self): + return self.value + +class NodeCollector (Collector): + def __init__ (self, collector_table, strict=False): + self.collector_table = collector_table + self.strict = strict + self.ignoring = 0 + self.value = collector_none + def startElementNS (self, name, qname, attrs): + if self.ignoring: + self.ignoring += 1 + else: + (uri, localname) = name + c_maker = self.collector_table.get (localname) or self.collector_table.get (collector_any) + if c_maker: + c = c_maker (name, attrs) + c.start (self, self.handler) + self.handler.push_collector (c) + else: + if self.strict: + raise Exception ("no handler for element '%s'; handlers: %s" % (localname, self.collector_table.keys ())) + else: + self.ignoring += 1 + def endElementNS (self, name, qname): + if self.ignoring: + self.ignoring -= 1 + else: + self.end () + def collect (self, value): + self.value = value + def finish (self): + return self.value + +class NamedCollector (NodeCollector): + def __init__ (self, name, collector_table): + NodeCollector.__init__ (self, collector_table) + self.name = name + def finish (self): + if self.value is collector_none: + return collector_none + else: + return (self.name, self.value) + +class ListCollector (NodeCollector): + def __init__ (self, collector_table): + NodeCollector.__init__ (self, collector_table) + self.values = [] + def collect (self, value): + self.values.append (value) + def finish (self): + return self.values + +class DictCollector (NodeCollector): + def __init__ (self, collector_table): + NodeCollector.__init__ (self, collector_table) + self.values = {} + def collect (self, key_value): + (key, value) = key_value + if self.values.get (key): + raise Exception ("dictionary key '%s' is already mapped" % key) + else: + self.values[key] = value + def finish (self): + return self.values + +class CollectorValue (NodeCollector): + def __init__ (self, val): + NodeCollector.__init__ (self, {}, strict=False) + self.collect (val) + +class CollectorNoneValue: pass +collector_none = 
CollectorNoneValue () +def CollectorNone (): + return CollectorValue (collector_none) + +class CollectorAnyElement: pass +collector_any = CollectorAnyElement () diff --git a/ia-legacy-importer/onix/test-onix.sh b/ia-legacy-importer/onix/test-onix.sh new file mode 100755 index 00000000..b33eb8f4 --- /dev/null +++ b/ia-legacy-importer/onix/test-onix.sh @@ -0,0 +1,6 @@ +#!/bin/sh -e + +. ./config.sh + +exec $PYTHON_INTERPRETER onix.py + diff --git a/ia-legacy-importer/onix/thread_utils.py b/ia-legacy-importer/onix/thread_utils.py new file mode 100644 index 00000000..f8167212 --- /dev/null +++ b/ia-legacy-importer/onix/thread_utils.py @@ -0,0 +1,85 @@ +# 2007 dbg for the Internet Archive + +import sys +from threading import Thread, Lock, Condition + +from six import reraise + +class AsyncChannel: + # yes, i believe this is just Queue ... i was new to python and couldn't find it + + def __init__ (self, buffer_size=1): + self.buffer = [] + self.max_items = buffer_size + self.lock = Lock () + self.not_empty = Condition (self.lock) + self.not_full = Condition (self.lock) + + def get (self): + self.lock.acquire () + while len (self.buffer) == 0: + self.not_empty.wait () + val = self.buffer.pop (0) + self.not_full.notifyAll () + self.lock.release () + return val + + def put (self, val): + self.lock.acquire () + while len (self.buffer) == self.max_items: + self.not_full.wait () + self.buffer.append (val) + self.not_empty.notifyAll () + self.lock.release () + +class ForeignException: + + def __init__ (self, exc_type, exc_value, exc_traceback): + self.exc_type = exc_type + self.exc_value = exc_value + self.exc_traceback = exc_traceback + + def re_raise (self): + reraise(self.exc_type, self.exc_value, self.exc_traceback) + +def ForeignException_extract (): + (exc_type, exc_value, exc_traceback) = sys.exc_info() + return ForeignException (exc_type, exc_value, exc_traceback) + +def threaded_generator (producer, buffer_size=1): + # the producer function will be invoked with a single argument, a "produce" function. + # the producer may pass an object to this "produce" function any number of times before + # returning. the values thus passed will, in turn, be produced by the generator which + # is the return value of threaded_generator(). + # + # this provides a sort of coroutine facility, because python's generators can't do that: + # they can only yield values from the bottom of the call stack. sometimes you need to + # keep control context between producing values. 
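+    #
+    # a minimal usage sketch (the producer below is made up for illustration):
+    #
+    #     def produce_numbers (produce):
+    #         for i in range (3):
+    #             produce (i)
+    #
+    #     for v in threaded_generator (produce_numbers, buffer_size=2):
+    #         print v    # 0, 1, 2 -- each value is handed across the AsyncChannel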
+ + t = None + chan = AsyncChannel (buffer_size) + + def produce (val): + chan.put (val) + + def main (): + try: + producer (produce) + chan.put (StopIteration ()) + except: + chan.put (ForeignException_extract ()) + + def generator (): + while True: + v = chan.get () + if isinstance (v, StopIteration): + break + if isinstance (v, ForeignException): + v.re_raise () + else: + yield v + + t = Thread (target=main) + t.setDaemon (True) + t.start () + return generator () diff --git a/ia-legacy-importer/onix/urlcache.py b/ia-legacy-importer/onix/urlcache.py new file mode 100644 index 00000000..ac5d9298 --- /dev/null +++ b/ia-legacy-importer/onix/urlcache.py @@ -0,0 +1,76 @@ +import sys +import os +import time +import shutil +import traceback +from fcntl import * + +from six.moves import urllib + + +class URLCache: + def __init__ (self, dir): + self.dir = dir + + def get_entries (self): + entries = {} + index_file = self.dir + "/index" + next = 0 + index = open (index_file, "a") # create index file if it doesn't exist + index.close () + index = open (index_file, "r+") + flock (index, LOCK_EX) + + for url in index: + entries[url.rstrip ()] = next + next += 1 + return (entries, next, index) + + def get (self, url): + url = url.strip () + (entries, next, index) = self.get_entries () + id = entries.get (url) + if id is None: + # with index locked, add an entry for this url and + # open a locked, temporary file to load its data + index.seek (0, 2) + index.write ("%s\n" % url) + data_file = self.dir + "/" + str (next) + tmp_data_file = data_file + "-fetching" + tmp_data = open (tmp_data_file, "w") + flock (tmp_data, LOCK_EX) + index.close () + + # having released the lock on the index, suck data + # into the temporary file + sys.stderr.write ("URLCache: fetching %s\n" % url) + net_data = urllib.request.urlopen (url) + shutil.copyfileobj (net_data, tmp_data) + tmp_data.flush () + os.link (tmp_data_file, data_file) # the fetch is good: attach it + tmp_data.close () # drop lock on temporary file + os.unlink (tmp_data_file) + id = next + + else: + # there is already an entry for this url, so release the lock on the index + index.close () + + data_file = self.dir + "/" + str (id) + if os.path.exists (data_file): + return open (data_file, "r") + else: + # wait for fetch to finish + tmp_data_file = data_file + "-fetching" + sys.stderr.write ("URLCache: waiting for %s\n" % data_file) + try: + try: + tmp_data = open (tmp_data_file) + flock (tmp_data, LOCK_SH) + tmp_data.close () + except OSError as e: + pass + return open (data_file, "r") + except Exception as exn: + # in case this happens, just blow away your cache + raise Exception ("URLCache: sorry, corrupted state for url '%s': %s" % (url, str (exn))) diff --git a/ia-legacy-importer/onix/xmltramp.py b/ia-legacy-importer/onix/xmltramp.py new file mode 100644 index 00000000..7d681cde --- /dev/null +++ b/ia-legacy-importer/onix/xmltramp.py @@ -0,0 +1,375 @@ +"""xmltramp: Make XML documents easily accessible.""" + +__version__ = "2.17" +__author__ = "Aaron Swartz" +__credits__ = "Many thanks to pjz, bitsko, and DanC." +__copyright__ = "(C) 2003-2006 Aaron Swartz. GNU GPL 2." 
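+
+# hedged usage sketch (the XML snippet is made up for illustration):
+#
+#     doc = parse ("<doc><author>Aaron Swartz</author></doc>")
+#     doc.author          # first child element named 'author'
+#     doc['author':]      # all children named 'author', as a list
+#     str (doc.author)    # -> 'Aaron Swartz'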
+ +import six + +def isstr(f): return isinstance(f, type('')) or isinstance(f, type(u'')) +def islst(f): return isinstance(f, type(())) or isinstance(f, type([])) + +empty = {'http://www.w3.org/1999/xhtml': ['img', 'br', 'hr', 'meta', 'link', 'base', 'param', 'input', 'col', 'area']} + +def quote(x, elt=True): + if elt and '<' in x and len(x) > 24 and x.find(']]>') == -1: return "" + else: x = x.replace('&', '&').replace('<', '<').replace(']]>', ']]>') + if not elt: x = x.replace('"', '"') + return x + +@six.python_2_unicode_compatible +class Element: + def __init__(self, name, attrs=None, children=None, prefixes=None, line=None): + if islst(name) and name[0] == None: name = name[1] + if attrs: + na = {} + for k in attrs.keys(): + if islst(k) and k[0] == None: na[k[1]] = attrs[k] + else: na[k] = attrs[k] + attrs = na + + self._name = name + self._attrs = attrs or {} + self._dir = children or [] + + prefixes = prefixes or {} + self._prefixes = dict(zip(prefixes.values(), prefixes.keys())) + + if prefixes: self._dNS = prefixes.get(None, None) + else: self._dNS = None + + self._line = line + + def __repr__(self, recursive=0, multiline=0, inprefixes=None): + def qname(name, inprefixes): + if islst(name): + if inprefixes[name[0]] is not None: + return inprefixes[name[0]]+':'+name[1] + else: + return name[1] + else: + return name + + def arep(a, inprefixes, addns=1): + out = '' + + for p in self._prefixes.keys(): + if not p in inprefixes.keys(): + if addns: out += ' xmlns' + if addns and self._prefixes[p]: out += ':'+self._prefixes[p] + if addns: out += '="'+quote(p, False)+'"' + inprefixes[p] = self._prefixes[p] + + for k in a.keys(): + out += ' ' + qname(k, inprefixes)+ '="' + quote(a[k], False) + '"' + + return out + + inprefixes = inprefixes or {u'http://www.w3.org/XML/1998/namespace':'xml'} + + # need to call first to set inprefixes: + attributes = arep(self._attrs, inprefixes, recursive) + out = '<' + qname(self._name, inprefixes) + attributes + + if not self._dir and (self._name[0] in empty.keys() + and self._name[1] in empty[self._name[0]]): + out += ' />' + return out + + out += '>' + + if recursive: + content = 0 + for x in self._dir: + if isinstance(x, Element): content = 1 + + pad = '\n' + ('\t' * recursive) + for x in self._dir: + if multiline and content: out += pad + if isstr(x): out += quote(x) + elif isinstance(x, Element): + out += x.__repr__(recursive+1, multiline, inprefixes.copy()) + else: + raise TypeError("I wasn't expecting "+ repr(x) +".") + if multiline and content: out += '\n' + ('\t' * (recursive-1)) + else: + if self._dir: out += '...' 
+ + out += '' + + return out + + def __str__(self): + text = '' + for x in self._dir: + text += six.text_type(x) + return ' '.join(text.split()) + + def __getattr__(self, n): + if n[0] == '_': raise AttributeError("Use foo['"+n+"'] to access the child element.") + if self._dNS: n = (self._dNS, n) + for x in self._dir: + if isinstance(x, Element) and x._name == n: return x + raise AttributeError('No child element named %s' % repr(n)) + + def __hasattr__(self, n): + for x in self._dir: + if isinstance(x, Element) and x._name == n: return True + return False + + def __setattr__(self, n, v): + if n[0] == '_': self.__dict__[n] = v + else: self[n] = v + + + def __getitem__(self, n): + if isinstance(n, type(0)): # d[1] == d._dir[1] + return self._dir[n] + elif isinstance(n, slice(0).__class__): + # numerical slices + if isinstance(n.start, type(0)): return self._dir[n.start:n.stop] + + # d['foo':] == all s + n = n.start + if self._dNS and not islst(n): n = (self._dNS, n) + out = [] + for x in self._dir: + if isinstance(x, Element) and x._name == n: out.append(x) + return out + else: # d['foo'] == first + if self._dNS and not islst(n): n = (self._dNS, n) + for x in self._dir: + if isinstance(x, Element) and x._name == n: return x + raise KeyError + + def __setitem__(self, n, v): + if isinstance(n, type(0)): # d[1] + self._dir[n] = v + elif isinstance(n, slice(0).__class__): + # d['foo':] adds a new foo + n = n.start + if self._dNS and not islst(n): n = (self._dNS, n) + + nv = Element(n) + self._dir.append(nv) + + else: # d["foo"] replaces first and dels rest + if self._dNS and not islst(n): n = (self._dNS, n) + + nv = Element(n); nv._dir.append(v) + replaced = False + + todel = [] + for i in range(len(self)): + if self[i]._name == n: + if replaced: + todel.append(i) + else: + self[i] = nv + replaced = True + if not replaced: self._dir.append(nv) + for i in todel: del self[i] + + def __delitem__(self, n): + if isinstance(n, type(0)): del self._dir[n] + elif isinstance(n, slice(0).__class__): + # delete all s + n = n.start + if self._dNS and not islst(n): n = (self._dNS, n) + + for i in range(len(self)): + if self[i]._name == n: del self[i] + else: + # delete first foo + for i in range(len(self)): + if self[i]._name == n: del self[i] + break + + def __call__(self, *_pos, **_set): + if _set: + for k in _set.keys(): self._attrs[k] = _set[k] + if len(_pos) > 1: + for i in range(0, len(_pos), 2): + self._attrs[_pos[i]] = _pos[i+1] + if len(_pos) == 1: + return self._attrs[_pos[0]] + if len(_pos) == 0: + return self._attrs + + def __len__(self): return len(self._dir) + + def get(self, n): + try: + return self.__getitem__(n) + except KeyError: + return None + + def getLineNumber (self): + return self._line + +class Namespace: + def __init__(self, uri): self.__uri = uri + def __getattr__(self, n): return (self.__uri, n) + def __getitem__(self, n): return (self.__uri, n) + +from xml.sax.handler import EntityResolver, DTDHandler, ContentHandler, ErrorHandler + +class Seeder(EntityResolver, DTDHandler, ContentHandler, ErrorHandler): + def __init__(self, parser=None): + if parser: + self.getLineNumber = lambda: parser.getLineNumber () + else: + self.getLineNumber = lambda: None + self.stack = [] + self.ch = '' + self.prefixes = {} + ContentHandler.__init__(self) + + def startPrefixMapping(self, prefix, uri): + if prefix not in self.prefixes: self.prefixes[prefix] = [] + self.prefixes[prefix].append(uri) + def endPrefixMapping(self, prefix): + self.prefixes[prefix].pop() + + def startElementNS(self, name, 
qname, attrs): + ch = self.ch; self.ch = '' + if ch and not ch.isspace(): self.stack[-1]._dir.append(ch) + + attrs = dict(attrs) + newprefixes = {} + for k in self.prefixes.keys(): newprefixes[k] = self.prefixes[k][-1] + + self.stack.append(Element(name, attrs, prefixes=newprefixes.copy(), line=self.getLineNumber ())) + + def characters(self, ch): + self.ch += ch + + def endElementNS(self, name, qname): + ch = self.ch; self.ch = '' + if ch and not ch.isspace(): self.stack[-1]._dir.append(ch) + + element = self.stack.pop() + if self.stack: + self.stack[-1]._dir.append(element) + else: + self.result = element + +from xml.sax import make_parser +from xml.sax.handler import feature_namespaces + +def seed(fileobj): + seeder = Seeder() + parser = make_parser() + parser.setFeature(feature_namespaces, 1) + parser.setContentHandler(seeder) + parser.parse(fileobj) + return seeder.result + +def parse(text): + from six import StringIO + return seed(StringIO(text)) + +def load(url): + import urllib + return seed(urllib.urlopen(url)) + +def unittest(): + parse('afoobara').__repr__(1,1) == \ + '\n\ta\n\t\tfoobar\n\ta\n' + + assert str(parse("")) == "" + assert str(parse("I love you.")) == "I love you." + assert parse("\nmom\nwow\n")[0].strip() == "mom\nwow" + assert str(parse(' center ')) == "center" + assert str(parse('\xcf\x80')) == '\xcf\x80' + + d = Element('foo', attrs={'foo':'bar'}, children=['hit with a', Element('bar'), Element('bar')]) + + try: + d._doesnotexist + raise Exception("ExpectedError but found success. Damn.") + except AttributeError: pass + assert d.bar._name == 'bar' + try: + d.doesnotexist + raise Exception("ExpectedError but found success. Damn.") + except AttributeError: pass + + assert hasattr(d, 'bar') == True + + assert d('foo') == 'bar' + d(silly='yes') + assert d('silly') == 'yes' + assert d() == d._attrs + + assert d[0] == 'hit with a' + d[0] = 'ice cream' + assert d[0] == 'ice cream' + del d[0] + assert d[0]._name == "bar" + assert len(d[:]) == len(d._dir) + assert len(d[1:]) == len(d._dir) - 1 + assert len(d['bar':]) == 2 + d['bar':] = 'baz' + assert len(d['bar':]) == 3 + assert d['bar']._name == 'bar' + + d = Element('foo') + + doc = Namespace("http://example.org/bar") + bbc = Namespace("http://example.org/bbc") + dc = Namespace("http://purl.org/dc/elements/1.1/") + d = parse(""" + John Polk and John Palfrey + John Polk + John Palfrey + Buffy + """) + + assert repr(d) == '...' + assert d.__repr__(1) == 'John Polk and John PalfreyJohn PolkJohn PalfreyBuffy' + assert d.__repr__(1,1) == '\n\tJohn Polk and John Palfrey\n\tJohn Polk\n\tJohn Palfrey\n\tBuffy\n' + + assert repr(parse("")) == '' + + assert str(d.author) == str(d['author']) == "John Polk and John Palfrey" + assert d.author._name == doc.author + assert str(d[dc.creator]) == "John Polk" + assert d[dc.creator]._name == dc.creator + assert str(d[dc.creator:][1]) == "John Palfrey" + d[dc.creator] = "Me!!!" + assert str(d[dc.creator]) == "Me!!!" + assert len(d[dc.creator:]) == 1 + d[dc.creator:] = "You!!!" + assert len(d[dc.creator:]) == 2 + + assert d[bbc.show](bbc.station) == "4" + d[bbc.show](bbc.station, "5") + assert d[bbc.show](bbc.station) == "5" + + e = Element('e') + e.c = '' + assert e.__repr__(1) == '<img src="foo">' + e.c = '2 > 4' + assert e.__repr__(1) == '2 > 4' + e.c = 'CDATA sections are closed with ]]>.' + assert e.__repr__(1) == 'CDATA sections are <em>closed</em> with ]]>.' + e.c = parse('
    i
    love
    you
    ') + assert e.__repr__(1) == '
    i
    love
    you
    ' + + e = Element('e') + e('c', 'that "sucks"') + assert e.__repr__(1) == '' + + + assert quote("]]>") == "]]>" + assert quote('< dkdkdsd dkd sksdksdfsd fsdfdsf]]> kfdfkg >') == '< dkdkdsd dkd sksdksdfsd fsdfdsf]]> kfdfkg >' + + assert parse('').__repr__(1) == '' + assert parse('').__repr__(1) == '' + +if __name__ == '__main__': unittest() diff --git a/ia-legacy-importer/people/build_object.py b/ia-legacy-importer/people/build_object.py new file mode 100644 index 00000000..9fcc6a8d --- /dev/null +++ b/ia-legacy-importer/people/build_object.py @@ -0,0 +1,64 @@ +from openlibrary.catalog.utils import flip_name, pick_first_date + + +def build_person_object(p, marc_alt): + ab = [(k, v.strip(' /,;:')) for k, v in p if k in 'ab'] + + has_b = any(k=='b' for k, v in p) + + orig_name = ' '.join(v if k == 'a' else v for k, v in ab) + c = ' '.join(v for k, v in p if k == 'c') + name = flip_name(orig_name) + if name[0].isdigit(): + name = orig_name + else: + of_count = c.count('of ') + # if of_count == 1 and not has_b and 'of the ' not in c: + # if c.startswith('King') + # + # if c.startswith('Queen'): + # name += ' ' + c[c.find('of '):] + # + if of_count == 1 and 'of the ' not in c and 'Emperor of ' not in c: + name += ' ' + c[c.find('of '):] + elif ' ' not in name and of_count > 1: + name += ', ' + c + elif c.endswith(' of') or c.endswith(' de') and any(k == 'a' and ', ' in v for k, v in p): + name = ' '.join(v for k, v in ab) + c += ' ' + name[:name.find(', ')] + name = name[name.find(', ') + 2:] + ', ' + c + + person = {} + d = [v for k, v in p if k =='d'] + if d: + person = pick_first_date(d) + person['name'] = name + person['sort'] = orig_name + + if any(k=='b' for k, v in p): + person['enumeration'] = ' '.join(v for k, v in p if k == 'b') + + if c: + person['title'] = c + person['marc'] = [p] + list(marc_alt) + + return person + +def test_consort(): + line = (('a', u'Elizabeth'), ('c', u'Empress, consort of Franz Joseph, Emperor of Austria')) + p = build_person_object(marc, []) + p['name'] == u'Empress Elizabeth, consort of Franz Joseph, Emperor of Austria', + + line = (('a', u'Mary'), ('c', u'Queen, Consort of George V, King of Great Britain'), ('d', u'1867-1953')) + p = build_person_object(marc, []) + p['name'] == u'Queen Mary, Consort of George V, King of Great Britain' + +def test_king_no_number(): + marc = (('a', u'Henry'), ('b', u'IV'), ('c', u'King of England'), ('d', u'1367-1413')) + p = build_person_object(marc, []) + assert p['name'] == u'Henry IV of England' + + marc = (('a', u'John'), ('c', u'King of England'), ('d', u'1167-1216')) + p = build_person_object(marc, []) + assert p['name'] == 'King John of England' + diff --git a/ia-legacy-importer/people/from_works.py b/ia-legacy-importer/people/from_works.py new file mode 100644 index 00000000..58530672 --- /dev/null +++ b/ia-legacy-importer/people/from_works.py @@ -0,0 +1,143 @@ +from __future__ import print_function +from openlibrary.catalog.utils.query import query_iter, set_staging, get_mc +from openlibrary.catalog.get_ia import get_data +from openlibrary.catalog.marc.fast_parse import get_tag_lines, get_all_subfields, get_subfields + +from pprint import pprint +from identify_people import read_people +from build_object import build_person_object +import sys +from collections import defaultdict + +set_staging(True) + +def work_and_marc(): + i = 0 + skip = True + for w in query_iter({'type': '/type/work', 'title': None}): + if skip: + if w['key'] == '/w/OL56814W': + skip = False + else: + continue + marc = set() + q = {'type': 
'/type/edition', 'works': w['key'], 'title': None, 'source_records': None} + for e in query_iter(q): + if e.get('source_records', []): + marc.update(i[5:] for i in e['source_records'] if i.startswith('marc:')) + mc = get_mc(e['key']) + if mc and not mc.startswith('ia:') and not mc.startswith('amazon:'): + marc.add(mc) + if marc: + yield w, marc + else: + print('no marc:', w) + + +def read_works(): + i = 0 + pages = {} + page_marc = {} + + for work, marc in work_and_marc(): + lines = [] + for loc in marc: + data = get_data(loc) + if not data: + continue + found = [v for k, v in get_tag_lines(data, set(['600']))] + if found: + lines.append((loc, found)) + if not lines: + continue + work['lines'] = lines + i += 1 + print(i, work['key'], work['title']) + + try: + people, marc_alt = read_people(j[1] for j in lines) + except AssertionError: + print(work['lines']) + continue + except KeyError: + print(work['lines']) + continue + + marc_alt_reverse = defaultdict(set) + for k, v in marc_alt.items(): + marc_alt_reverse[v].add(k) + + w = ol.get(work['key']) + w['subject_people'] = [] + for p, num in people.iteritems(): + print(' %2d %s' % (num, ' '.join("%s: %s" % (k, v) for k, v in p))) + print(' ', p) + if p in page_marc: + w['subject_people'].append({'key': '/subjects/people/' + page_marc[p]}) + continue + obj = build_person_object(p, marc_alt_reverse.get(p, [])) + key = obj['name'].replace(' ', '_') + full_key = '/subjects/people/' + key + w['subject_people'].append({'key': full_key}) + + if key in pages: + print(key) + pages[key]['marc'].append(p) + continue + + for m in obj['marc']: + page_marc[m] = key + + pages[key] = obj + obj_for_db = obj.copy() + del obj_for_db['marc'] + obj_for_db['key'] = full_key + obj_for_db['type'] = '/type/person' + print(ol.save(full_key.encode('utf-8'), obj_for_db, 'create a new person page')) + + print(w) + print(ol.save(w['key'], w, 'add links to people that this work is about')) + +def from_sample(): + i = 0 + pages = {} + page_marc = {} + for line in open('work_and_marc5'): + i += 1 + w = eval(line) +# print i, w['key'], w['title'] +# print w['lines'] + try: + people, marc_alt = read_people(j[1] for j in w['lines']) + except AssertionError: + print([j[1] for j in w['lines']]) + raise + marc_alt_reverse = defaultdict(set) + for k, v in marc_alt.items(): + marc_alt_reverse[v].add(k) + + for p, num in people.iteritems(): + if p in page_marc: + continue + obj = build_person_object(p, marc_alt_reverse.get(p, [])) + key = obj['name'].replace(' ', '_') + for m in obj['marc']: + page_marc[m] = key + if key in pages: +# print key +# print p +# for m in pages[key]['marc']: +# print m +# print + pages[key]['marc'].append(p) + else: + pages[key] = obj +# pprint(obj) +# continue + if obj['name'][1].isdigit(): + print([j[1] for j in w['lines']]) + pprint(obj) +# assert not obj['name'][1].isdigit() + +from_sample() +#read_works() diff --git a/ia-legacy-importer/people/identify_people.py b/ia-legacy-importer/people/identify_people.py new file mode 100644 index 00000000..7c8126b1 --- /dev/null +++ b/ia-legacy-importer/people/identify_people.py @@ -0,0 +1,997 @@ +from __future__ import print_function +from openlibrary.catalog.marc.cmdline import fmt_subfields +from openlibrary.catalog.marc.fast_parse import get_subfields, get_all_subfields +from openlibrary.catalog.utils import remove_trailing_dot, remove_trailing_number_dot, match_with_bad_chars, pick_first_date +import openlibrary.catalog.utils.authority as authority +from openlibrary.catalog.merge.normalize import normalize 
+from collections import defaultdict +import re + +def strip_death(date): + return date[:date.rfind('-')+1] + +def test_strip_death(): + assert strip_death("1850-1910") == "1850-" + +re_dates = re.compile(' (\d{2,4}-(?:\d{2,4})?)$') +re_dates_in_field = re.compile('^(\d{2,4})-((?:\d{2,4})?)$') +re_dates_in_field_bc = re.compile('^(\d{2,4}) B\.C\.-((?:\d{2,4}) B\.C\.?)$') + +def test_transpose_date(): + assert transpose_date(u'1452') == u'1425' + +def transpose_date(date): + return date[:-2] + date[-1] + date[-2] + +def is_date_transposed(d1, d2): + m1 = re_dates_in_field.match(d1) + m2 = re_dates_in_field.match(d2) + if not m1 and not m2: + m1 = re_dates_in_field_bc.match(d1) + m2 = re_dates_in_field_bc.match(d2) + if not m1 or not m2: + return False + + if m1.group(1) == m2.group(1): + death1 = m1.group(2) + death2 = m2.group(2) + if not death1 or not death2: + return False + return transpose_date(death1) == death2 + if m1.group(2) == m2.group(2): + birth1 = m1.group(1) + birth2 = m2.group(1) + return transpose_date(birth1) == birth2 + return False + +def test_is_date_transposed(): + assert is_date_transposed(u'1452-1485', u'1425-1485') + +def dates_not_close(d1, d2): + m1 = re_dates_in_field.match(d1) + if not m1: + return False + m2 = re_dates_in_field.match(d2) + if not m2: + return False + + birth1 = int(m1.group(1)) + birth2 = int(m2.group(1)) + if abs(birth1 - birth2) >= 10: + return True + + if not m1.group(2) or not m2.group(2): + return False + + death1 = int(m1.group(2)) + death2 = int(m2.group(2)) + return abs(death1 - death2) >= 10 + +def test_dates_not_close(): + assert dates_not_close('1825-1899', '1804-1849') + assert not dates_not_close(u'1907-2003', u'1909-') + assert not dates_not_close('1825-1899', '1826-1898') + +def combinations(iterable, r): + # combinations('ABCD', 2) --> AB AC AD BC BD CD + # combinations(range(4), 3) --> 012 013 023 123 + pool = tuple(iterable) + n = len(pool) + if r > n: + return + indices = range(r) + yield tuple(pool[i] for i in indices) + while True: + for i in reversed(range(r)): + if indices[i] != i + n - r: + break + else: + return + indices[i] += 1 + for j in range(i+1, r): + indices[j] = indices[j-1] + 1 + yield tuple(pool[i] for i in indices) + +def tidy_subfield(v): + return remove_trailing_dot(v.strip(' /,;:')) + +re_bc_date = re.compile('(\d+)B\.C\.') + +def clean_subfield(k, v): + if k in 'abc': + v = tidy_subfield(v) + elif k == 'd': + v = remove_trailing_number_dot(v.strip(' ,')) + v = re_bc_date.sub(lambda m: m.group(1) + " B.C.", v) + return (k, v) + +def has_subtag(a, subfields): + return any(k==a for k, v in subfields) + +def question_date(p1, p2): + marc_date1 = tuple(v for k, v in p1 if k =='d') + if not marc_date1: + return + marc_date2 = tuple(v for k, v in p2 if k =='d') + if not marc_date1 or not marc_date2 or marc_date1 == marc_date2: + return + + assert len(marc_date1) == 1 and len(marc_date2) == 1 + + name1 = tuple((k, v) for k, v in p1 if k !='d') + name2 = tuple((k, v) for k, v in p2 if k !='d') + if name1 != name2: + return + + marc_date1 = marc_date1[0] + question1 = '?' in marc_date1 + + marc_date2 = marc_date2[0] + question2 = '?' 
in marc_date2 + + if (not question1 and not question2) or (question1 and question2): + return # xor + + if marc_date1.replace('?', '') != marc_date2.replace('?', ''): + return + return 1 if question1 else 2 + +def get_marc_date(p): + marc_date = tuple(v for k, v in p if k =='d') + if not marc_date: + return + assert len(marc_date) == 1 + return marc_date[0].strip() + +def build_by_name(found): + by_name = defaultdict(set) + for p in found: + if has_subtag('d', p): + without_date = tuple(i for i in p if i[0] != 'd') + by_name[without_date].add(p) + + return by_name + +def build_name_and_birth(found): + # one author missing death date + name_and_birth = defaultdict(set) + for p in found: + d = get_marc_date(p) + if not d or d[-1] == '-' or '-' not in d: + continue + without_death = tuple((k, (v if k!='d' else strip_death(v))) for k, v in p) +# assert without_death not in name_and_birth + name_and_birth[without_death].add(p) + return name_and_birth + +def authority_lookup(to_check, found, marc_alt): + found_matches = False + for person_key, match in to_check.items(): + if len(match) == 1: + continue + if len(match) == 2: + d1, d2 = [get_marc_date(p) for p in match] + if dates_not_close(d1, d2) and not is_date_transposed(d1, d2): + continue + + name = ' '.join(v.strip() for k, v in person_key if k != 'd') + search_results = authority.search(name) + match_dates = dict((get_marc_date(p), p) for p in match) + norm_name = normalize(name) + authority_match = None + for i in search_results: + if i['type'] != 'personal name' or i['a'] == 'reference': + continue + if norm_name not in normalize(i['heading']): + continue + for d, p in match_dates.items(): + if i['heading'].endswith(d): + if authority_match: # more than one match + print('dups:', match_dates.items()) + authority_match = None + break + authority_match = p + if authority_match: + for p in match: + if p == authority_match: + continue + found[authority_match] += found.pop(p) + marc_alt[p] = authority_match + found_matches = True + return found_matches + +def subtag_should_be_c(found, marc_alt): + merge = [] + for p1, p2 in combinations(found, 2): + if len(p1) != len(p2): + continue + + subtag1 = [k for k, v in p1 if k in 'abcdq'] + subtag2 = [k for k, v in p2 if k in 'abcdq'] + + if subtag1 == subtag2: + continue + + def no_question_if_d(p): + return [v.replace('?', '') if k == 'd' else tidy_subfield(v) for k, v in p] + if no_question_if_d(p1) != no_question_if_d(p2): + continue + + for i in range(len(subtag1)): + if subtag1[i] == subtag2[i]: + continue + assert len(p1[i][1]) >= 5 + + if subtag1[i] == 'c': + assert subtag2[i] in 'bq' + merge.append((p1, p2)) + else: + assert subtag1[i] in 'bq' and subtag2[i] == 'c' + merge.append((p2, p1)) + break + + for a, b in merge: + if b not in found: + continue + found[a] += found.pop(b) + marc_alt[b] = a + +def merge_question_date(found, marc_alt): + merge = [] + for p1, p2 in combinations(found, 2): + primary = question_date(p1, p2) + if primary is None: + continue + if primary == 1: + merge.append((p1, p2)) + else: + assert primary == 2 + merge.append((p2, p1)) + + for a, b in merge: + found[a] += found.pop(b) + marc_alt[b] = a + +re_bad_marc = re.compile(' ?\$ ?[a-z] ') +def remove_bad_marc_subtag(s): + s = re_bad_marc.sub(' ', s) + return s + +def test_remove_bad_marc_subtag(): + assert remove_bad_marc_subtag('John, $ c King of England') == 'John, King of England' + + +def just_abcdq(p): + return tuple((k, v) for k, v in p if k in 'abcdq') + +def similar_dates(found, marc_alt): + # 1516 == d. 
1516 + merge = [] + for p1, p2 in combinations(found, 2): + subtag1 = [k for k, v in p1] + subtag2 = [k for k, v in p2] + if subtag1 != subtag2: + continue + if [(k, v) for k, v in p1 if k != 'd'] != [(k, v) for k, v in p2 if k != 'd']: + continue + d1 = [v for k, v in p1 if k == 'd'] + d2 = [v for k, v in p2 if k == 'd'] + if d1 == d2: + continue + assert len(d1) == 1 and len(d2) == 1 + d1, d2 = d1[0], d2[0] + if d1 == 'd. ' + d2: + merge.append((p1, p2)) + continue + if d2 == 'd. ' + d1: + merge.append((p2, p1)) + continue + + for a, b in merge: + if b not in found: + continue + found[a] += found.pop(b) + marc_alt[b] = a + +re_simple_date = re.compile('^(\d+)-(\d+)?\.?$') + +def fix_bad_subtags(found, marc_alt): + just_values = defaultdict(lambda:defaultdict(int)) + for p, num in found.items(): + just_values[tuple(v.strip(',') for k, v in p)][p] += num + + for a, b in just_values.items(): + if len(b) == 1: + continue + b = sorted(b.items(), key=lambda i:i[1]) + if b[-1][1] == b[-2][1]: + continue + new = b.pop()[0] + for i, j in b: + found[new] += found.pop(i) + marc_alt[i] = new + +def wrong_subtag_on_date(found, marc_alt): + for p in found.keys(): + found_simple_date = False + for k, v in p: + if k != 'd' and re_simple_date.match(v): + found_simple_date = True + break + if not found_simple_date: + continue + new = tuple((('d' if k !='d' and re_simple_date.match(v) else k), v) for k, v in p) + if new in found: + found[new] += found.pop(p) + marc_alt[p] = new + +def missing_subtag(found, marc_alt): + merge = defaultdict(set) + for p1, p2 in combinations(found, 2): + subtag1 = [k for k, v in p1 if k in 'abcdq'] + subtag2 = [k for k, v in p2 if k in 'abcdq'] + + if subtag1 == subtag2: + continue + + name1 = ' '.join(v.strip() for k, v in p1) + name2 = ' '.join(v.strip() for k, v in p2) + + if not match_with_bad_chars(name1, name2) \ + and normalize(name1) != normalize(name2) \ + and normalize(remove_bad_marc_subtag(name1)) != normalize(remove_bad_marc_subtag(name2)) \ + and normalize(name1.lower().replace(' the', '')) != normalize(name2.lower().replace(' the', '')): + continue + + if len(subtag1) > len(subtag2): + merge[p2].add(just_abcdq(p1)) + else: + merge[p1].add(just_abcdq(p2)) + + def flat_len(p): + return len(' '.join(v for k, v in p)) + + for old, new in merge.items(): + by_size = sorted((flat_len(p), p) for p in new) + if len(by_size) > 1: + assert by_size[-1][0] > by_size[-2][0] + new_marc = by_size[-1][1] + + found[new_marc] += found.pop(old) + marc_alt[old] = new_marc + +def date_field_missing(p): + if has_subtag('d', p): + return p + assert has_subtag('a', p) + for k, v in p: + if k == 'a': + a = v + break + m = re_dates.search(a) + if not m: + return p + d = m.group(1) + a = tidy_subfield(a[:m.start()]) + new = [] + for k, v in p: + if k == 'a' and a: + new.append(('a', a)) + a = None + continue + if k not in ('b', 'c') and d: + new.append(('d', d)) + d = None + new.append((k, v)) + if d: + new.append(('d', d)) + return tuple(new) + +def bad_char_name_match(found, marc_alt): + merge = [] + for p1, p2 in combinations(found, 2): + if p1 == p2: + continue + if get_marc_date(p1) != get_marc_date(p2): + continue + p1, p2 = sorted([p1, p2], key=lambda i:found[i]) + if found[p1] != found[p2]: + name1 = ' '.join(v for k, v in p1 if k in 'abc') + name2 = ' '.join(v for k, v in p2 if k in 'abc') + if match_with_bad_chars(name1, name2): + found[p2] += found.pop(p1) + marc_alt[p1] = p2 + + for a, b in merge: + if b not in found: + continue + found[a] += found.pop(b) + marc_alt[b] = a + 
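+
+# Shared convention for the merge helpers above and for read_people() below
+# (a summarizing comment, not part of the original code): `found` maps a
+# person heading -- a tuple of (subtag, value) pairs such as
+# (('a', u'Frisch, Max'), ('d', u'1911-1991')) -- to the number of times that
+# heading was seen, and `marc_alt` maps every heading that gets merged away to
+# the canonical heading it was folded into.  Each helper mutates both dicts in
+# place, so occurrence counts accumulate on the surviving heading.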
+def check_for_dup_a(p): + for a1, a2 in combinations((v for k, v in p if k == 'a'), 2): + assert a1 != a2 + +def read_people(people): + found = defaultdict(int) + marc_alt = {} + people = list(people) + + for lines in people: + for line in lines: + p = tuple(clean_subfield(k, v) for k, v in get_all_subfields(line)) + #check_for_dup_a(p) + found[date_field_missing(p)]+=1 + + for p in found.keys(): + c = None + for k, v in p: + if k == 'c': + c = v + break + if not c or c.lower() != 'family': + continue + new = tuple((k, v + ' family' if k == 'a' else v) for k, v in p if k != 'c') + if new in found: + found[new] += found.pop(p) + marc_alt[p] = new + + fix_bad_subtags(found, marc_alt) + + wrong_subtag_on_date(found, marc_alt) + + try: + missing_subtag(found, marc_alt) + except AssertionError: + print(people) + raise + + found_name = defaultdict(int) + for p, num in found.items(): + found_name[just_abcdq(p)] += num + found = found_name + + assert found + + if len(found) == 1: + return dict(found), marc_alt + + #for func in subtag_should_be_c, merge_question_date: + #for func in subtag_should_be_c, merge_question_date, missing_subtag, bad_char_name_match: + for func in subtag_should_be_c, merge_question_date, bad_char_name_match, similar_dates: + func(found, marc_alt) + + if len(found) == 1: + return dict(found), marc_alt + + assert found + + # one author missing death date + name_and_birth = build_name_and_birth(found) + + assert found + + try: + if authority_lookup(name_and_birth, found, marc_alt): + if len(found) == 1: + return dict(found), marc_alt + + name_and_birth = build_name_and_birth(found) + except AssertionError: + print(people) + raise + + assert found + + for p, num in found.items(): + if p not in name_and_birth: + continue + assert len(name_and_birth[p]) == 1 + new_name = list(name_and_birth[p])[0] + found[new_name] += found.pop(p) + marc_alt[p] = new_name + + assert found + + if len(found) == 1: + return dict(found), marc_alt + + # match up authors with the same name + # where one has dates and the other doesn't + by_name = build_by_name(found) + + try: + if authority_lookup(by_name, found, marc_alt): + if len(found) == 1: + return dict(found), marc_alt + by_name = build_by_name(found) # rebuild + except AssertionError: + print(people) + raise + + for p, num in found.items(): + if p not in by_name: + continue + if len(by_name[p]) != 1: + for i in by_name[p]: + print(i) + print(people) + assert len(by_name[p]) == 1 + new_name = list(by_name[p])[0] + found[new_name] += found.pop(p) + marc_alt[p] = new_name + assert found + + if len(found) == 1: + return dict(found), marc_alt + + by_date = defaultdict(set) + for p in found: + if not has_subtag('d', p): + continue + d = tuple(v for k, v in p if k=='d') + by_date[d].add(p) +# for k, v in by_date.iteritems(): +# print len(v), k, v + + return dict(found), marc_alt + +def read_files(): + read_file('work_and_marc2') + read_file('work_and_marc3') + +def read_file(filename): + for file_line in open(filename): + w = eval(file_line) + if len(w['lines']) == 1: + continue + lines = [i[1] for i in w['lines']] + print(w['key'], w['title']) + print(lines) + people, marc_alt = read_people(lines) +# for p, num in people.iteritems(): +# if any(k=='d' for k, v in people): +# continue + for p, num in people.iteritems(): + print(' %2d %s' % (num, ' '.join("%s: %s" % (k, v) for k, v in p))) + print(' ', p) + print() +#read_file() + +def test_accents(): + lines = [ + ['00\x1faB\xe5adar\xe5aya\xf2na.\x1ftBrahmas\xe5utra.\x1e'], + 
['00\x1faB\xe5adar\xe5aya\xf2na.\x1ftBrahmas\xe5utra.\x1e'], + ['00\x1faB\xe5adar\xe5aya\xf2na.\x1ftBrahmas\xe5utra.\x1e'], + ['00\x1faB\xe5adar\xe5aya\xf2na.\x1ftBrahmas\xe5utra.\x1e'], + ['00\x1faB\xe5adar\xe5aya\xf2na.\x1ftBrahmas\xe5utra.\x1e'], + ['00\x1faB\xe5adar\xe5ayana.\x1ftBrahmas\xe5utra.\x1e'] + ] + a, b = read_people(lines) + assert a == {(('a', u'B\u0101dar\u0101ya\u1e47a'),): 6} + assert b == { (('a', u'B\u0101dar\u0101yana'),): (('a', u'B\u0101dar\u0101ya\u1e47a'),)} + +def test_same_name_one_date_missing(): + lines = [ + ['10\x1faAbedin, Zainul\x1fxCriticism and interpretation.\x1e'], + ['10\x1faAbedin, Zainul,\x1fd1914-1976\x1fxCriticism and interpretation.\x1e'], + + ['10\x1faAbedin, Zainul\x1fxCriticism and interpretation.\x1e'], + ['10\x1faAbedin, Zainul,\x1fd1914-1976\x1fxCriticism and interpretation.\x1e'] + ] + a, b = read_people(lines) + + assert a == {(('a', u'Abedin, Zainul'), ('d', u'1914-1976')): 4} + assert b == {(('a', u'Abedin, Zainul'),): (('a', u'Abedin, Zainul'), ('d', u'1914-1976'))} + +def test_matching_name_missing_death(): + lines = [ + ['10\x1faFrisch, Max,\x1fd1911-1991\x1e'], + ['10\x1faFrisch, Max,\x1fd1911-\x1e'], + ['10\x1faFrisch, Max,\x1fd1911-\x1e'] + ] + a, b = read_people(lines) + assert a == {(('a', u'Frisch, Max'), ('d', u'1911-1991')): 3} + assert b == {(('a', u'Frisch, Max'), ('d', u'1911-')): (('a', u'Frisch, Max'), ('d', u'1911-1991'))} + +def test_matching_dates(): + lines = [ + ['00\x1faMichelangelo Buonarroti,\x1fd1475-1564.\x1e'], + ['00\x1faMichelangelo Buonarroti,\x1fd1475-1564.\x1e'], + ['16\x1faBuonarroti, Michel Angelo,\x1fd1475-1564.\x1e'] + ] + a, b = read_people(lines) + +def test_harold_osman_kelly(): + lines = [ + ['10\x1faKelly, Harold Osman,\x1fd1884-1955.\x1e'], + ['10\x1faKelly, Harold Osman,\x1fd1884-1956.\x1e'] + ] + a, b = read_people(lines) + assert a == {(('a', u'Kelly, Harold Osman'), ('d', u'1884-1955')): 2} + assert b == {(('a', u'Kelly, Harold Osman'), ('d', u'1884-1956')): (('a', u'Kelly, Harold Osman'), ('d', u'1884-1955'))} + +def test_question_date(): + lines = [ + ['10\x1faBurke, Edmund,\x1fd1729?-1797.\x1ftReflections on the revolution in France.\x1e', '10\x1faCalonne,\x1fcM. de\x1fq(Charles Alexandre de),\x1fd1734-1802.\x1e'], + ['10\x1faBurke, Edmund,\x1fd1729-1797.\x1ftReflections on the Revolution in France.\x1e'] + ] + a, b = read_people(lines) + assert a == { + (('a', u'Burke, Edmund'), ('d', u'1729?-1797')): 2, + (('a', u'Calonne'), ('c', u'M. 
de'), ('q', u'(Charles Alexandre de),'), ('d', u'1734-1802')): 1 + } + + assert b == { + (('a', u'Burke, Edmund'), ('d', u'1729-1797')): (('a', u'Burke, Edmund'), ('d', u'1729?-1797')) + } + + +def test_pope_sixtus(): + lines = [ + ['00\x1faSixtus\x1fbV,\x1fcPope,\x1fd1521-1590.\x1e'], + ['04\x1faSixtus\x1fbV,\x1fcPope.\x1e'], + ['00\x1faSixtus\x1fbV,\x1fcPope,\x1fd1520-1590.\x1e'] + ] + a, b = read_people(lines) + assert a == { + ((u'a', u'Sixtus'), (u'b', u'V'), (u'c', u'Pope'), (u'd', u'1520-1590')): 3 + } + + assert b == { + (('a', u'Sixtus'), ('b', u'V'), ('c', u'Pope')): (('a', u'Sixtus'), ('b', u'V'), ('c', u'Pope'), ('d', u'1520-1590')), + (('a', u'Sixtus'), ('b', u'V'), ('c', u'Pope'), ('d', u'1521-1590')): (('a', u'Sixtus'), ('b', u'V'), ('c', u'Pope'), ('d', u'1520-1590')) + } + +def test_william_the_conqueror(): + lines = [ + ['00\x1faWilliam\x1fbI,\x1fcKing of England,\x1fd1027 or 8-1087.\x1e'], ['04\x1faWilliam\x1fbI,\x1fcKing of England,\x1fd1027?-1087.\x1e'], + ['00\x1faWilliam\x1fbI,\x1fcKing of England,\x1fd1027 or 8-1087.\x1e'], ['00\x1faWilliam\x1fbI,\x1fcKing of England,\x1fd1027 or 8-1087\x1e'], + ['00\x1faWilliam\x1fbI,\x1fcKing of England,\x1fd1027 or 8-1087.\x1e'], ['00\x1faWilliam\x1fbI,\x1fcKing of England,\x1fd1027 or 8-1087.\x1e'] + ] + a, b = read_people(lines) + + assert a == {(('a', u'William'), ('b', u'I'), ('c', u'King of England'), ('d', u'1027 or 8-1087')): 6} + assert b == {(('a', u'William'), ('b', u'I'), ('c', u'King of England'), ('d', u'1027?-1087')): (('a', u'William'), ('b', u'I'), ('c', u'King of England'), ('d', u'1027 or 8-1087'))} + +def test_missing_d(): + lines = [ + [' 0\x1faDickens, Charles, 1812-1870\x1fxManuscripts\x1fxFacsimiles.\x1e'], + ['10\x1faDickens, Charles,\x1fd1812-1870\x1fxManuscripts\x1fxFacsimiles.\x1e'] + ] + a, b = read_people(lines) + assert a == {(('a', u'Dickens, Charles'), ('d', u'1812-1870')): 2} + #assert b == {(('a', u'Dickens, Charles, 1812-1870'),): (('a', u'Dickens, Charles'), ('d', u'1812-1870'))} + assert b == {} + +def test_missing_c(): + return # skip for now + lines = [ + ['00\x1faMuhammad Quli Qutb Shah,\x1fcSultan of Golkunda,\x1fd1565-1612.\x1e'], + ['00\x1faMuhammad Quli Qutb Shah,\x1fcSultan of Golkunda,\x1fd1565-1612.\x1e'], + ['10\x1faMuhammad Quli Qutb Shah, Sultan of Golconda,\x1fd1565-1612\x1e'] + ] + a, b = read_people(lines) + assert a == {(('a', u'Muhammad Quli Qutb Shah'), ('c', u'Sultan of Golkunda'), ('d', u'1565-1612')): 3} + +def test_same_len_subtag(): + lines = [ + ['00\x1faJohn,\x1fcKing of England,\x1fd1167-1216\x1e', '10\x1faShakespeare, William,\x1fd1564-1616\x1fxStage history\x1e'], + ['00\x1faJohn,\x1fcKing of England,\x1fd1167-1216\x1fxDrama.\x1e', '10\x1faShakespeare, William,\x1fd1564-1616\x1fxStage history.\x1e'], + ['00\x1faJohn\x1fbKing of England,\x1fd1167-1216\x1fxDrama.\x1e', '10\x1faShakespeare, William,\x1fd1564-1616\x1fxStage history.\x1e'] + ] + a, b = read_people(lines) + assert a == { + (('a', u'John'), ('c', u'King of England'), ('d', u'1167-1216')): 3, + (('a', u'Shakespeare, William'), ('d', u'1564-1616')): 3 + } + +def test_king_john(): + lines = [ + ['00\x1faJohn,\x1fcKing of England,\x1fd1167-1216\x1fxDrama.\x1e'], + ['00\x1faJohn,\x1fcKing of England,\x1fd1167-1216\x1fxDrama\x1e', '10\x1faKean, Charles John,\x1fd1811?-1868\x1e'], + ['00\x1faJohn,\x1fcKing of England,\x1fd1167-1216\x1fxDrama\x1e'], + ['00\x1faJohn\x1fbKing of England,\x1fd1167-1216\x1fxDrama.\x1e'], + ['00\x1faJohn,\x1fcKing of England,\x1fd1167?-1216\x1fxDrama.\x1e'], + ['00\x1faJohn\x1fbKing 
of England,\x1fd1167-1216\x1fxDrama.\x1e'], + ['00\x1faJohn\x1fbKing of England,\x1fd1167-1216\x1fxDrama.\x1e'], + ['00\x1faJohn,\x1fcKing of England,\x1fd1167-1216\x1fvDrama.\x1e'], + ['00\x1faJohn\x1fbKing of England,\x1fd1167-1216\x1fvDrama.\x1e'], + ['00\x1faJohn,\x1fcKing of England,\x1fd1167?-1216\x1fxDrama.\x1e'], + ['00\x1faJohn,\x1fcKing of England,\x1fd1167?-1216\x1fxDrama.\x1e'], + ['00\x1faJohn,\x1fcKing of England,\x1fd1167?-1216\x1fxDrama.\x1e'], + ['00\x1faJohn,\x1fcKing of England,\x1fd1167-1216\x1fvDrama\x1e'], + ['00\x1faJohn,\x1fcKing of England,\x1fd1167-1216\x1fvDrama.\x1e'], + ['00\x1faJohn,\x1fcKing of England,\x1fd1167?-1216\x1fxDrama.\x1e'], + ['00\x1faJohn,\x1fcKing of England,\x1fd1167-1216\x1fxDrama.\x1e'], + ['00\x1faJohn,\x1fcKing of England,\x1fd1167-1216\x1fxDrama.\x1e'], + ['00\x1faJohn,\x1fcKing of England,\x1fd1167-1216\x1fvDrama.\x1e'], + ['00\x1faJohn,\x1fcKing of England,\x1fd1167-1216\x1fxDrama.\x1e'], + ['00\x1faJohn\x1fbKing of England,\x1fd1167-1216\x1fxDrama.\x1e'], + ['00\x1faJohn,\x1fcKing of England,\x1fd1167?-1216\x1fvDrama.\x1e', '00\x1faHenry\x1fbVIII,\x1fcKing of England,\x1fd1491-1547\x1fvDrama.\x1e'], + ['00\x1faJohn,\x1fcKing of England,\x1fd1167-1216\x1fvDrama.\x1e'], + ['00\x1faJohn,\x1fcKing of England,\x1fd1167-1216\x1fvDrama.\x1e'], + ['00\x1faJohn\x1fbKing of England,\x1fd1167-1216\x1fxDrama.\x1e'], + ['14\x1faShakespeare, William,\x1fd1564-1616.\x1ftKing John.\x1e'], + ['00\x1faJohn,\x1fcKing of England,\x1fd1167-1216\x1fvDrama.\x1e', '10\x1faShakespeare, William,\x1fd1564-1616.\x1ftKing John.\x1e'], + ['00\x1faJohn,\x1fcKing of England,\x1fd1167-1216\x1fxDrama\x1e'], + ['00\x1faJohn,\x1fcKing of England,\x1fd1167-1216\x1fvDrama.\x1e'], + ['00\x1faJohn,\x1fcKing of England,\x1fd1167-1216\x1fxDrama\x1e', '00\x1faHenry\x1fbVIII,\x1fcKing of England,\x1fd1491-1547\x1fxDrama\x1e'], + ['00\x1faJohn,\x1fcKing of England,\x1fd1167-1216\x1fxDrama.\x1e'], + ['00\x1faJohn,\x1fcKing of England,\x1fd1167?-1216\x1fxDrama.\x1e'], + ['00\x1faJohn,\x1fcKing of England,\x1fd1167-1216\x1fxDrama.\x1e', '10\x1faShakespeare, William,\x1fd1564-1616.\x1fxKing John\x1fxProblems, exercises, etc.\x1e', '01\x1faJohn,\x1fcKing of England,\x1fd1167-1216\x1fxDrama.\x1e'], + ['00\x1faJohn, $ c King of England,\x1fd1167-1216\x1fxDrama\x1e'], + ['00\x1faJohn, $ c King of England,\x1fd1167-1216\x1fxDrama\x1e'], + ['00\x1faJohn\x1fbKing of England,\x1fd1167-1216\x1fxDrama.\x1e'] + ] + a, b = read_people(lines) + assert a == { + (('a', u'Shakespeare, William'), ('d', u'1564-1616')): 3, + (('a', u'Kean, Charles John'), ('d', u'1811?-1868')): 1, + (('a', u'John'), ('c', u'King of England'), ('d', u'1167?-1216')): 35, + (('a', u'Henry'), ('b', u'VIII'),('c', u'King of England'), ('d', u'1491-1547')): 2 + } + +def test_non_ascii(): + lines = [ + ['00\x1faA\xe2soka,\x1fcKing of Magadha,\x1fdfl. 259 B.C.\x1e'], + ['00\x1faA{acute}soka,\x1fcKing of Magadha\x1fdfl. 259 B.C.\x1e'], + ['00\x1faAsoka,\x1fcKing of Magadha,\x1fdfl. 259 B.C..\x1e', '30\x1faMaurya family.\x1e'], + ['04\x1faAs\xcc\x81oka,\x1fcKing of Magadha,\x1fdca. 274-232 B.C.\x1e'], + ['00\x1faA\xe2soka,\x1fcKing of Magadha,\x1fdfl. 259 B.C.\x1e', '30\x1faMaurya dynasty.\x1e'], + ['04\x1faAsoka,\x1fcKing of Magadha,\x1fdca. 274-232 B.C.\x1e'], + ['00\x1faA\xe2soka,\x1fcKing of Magadha,\x1fdfl. 259 B.C\x1e', '30\x1faMaurya dynasty\x1e'], + ['00\x1faAs\xcc\x81oka,\x1fcKing of Magadha,\x1fdfl. 
259 B.C.\x1e', '30\x1faMaurya family.\x1e'] + ] + a, b = read_people(lines) + print(a) + +def test_q_should_be_c(): + lines = [ + ['10\x1faLafayette, Marie Joseph Paul Yves Roch Gilbert Du Motier,\x1fcmarquis de,\x1fd1757-1834\x1fxTravel\x1fzNew York (State)\x1fzNew York.\x1e'], + ['10\x1faLafayette, Marie Joseph Paul Yves Roch Gilbert Du Motier,\x1fcmarquis de,\x1fd1757-1834\x1fxTravel\x1fzNew York (State)\x1fzNew York.\x1e'], + ['10\x1faLafayette, Marie Joseph Paul Yves Roch Gilbert Du Motier,\x1fqmarquis de,\x1fd1757-1834.\x1e'] + ] + a, b = read_people(lines) + +def test_date_in_a(): + lines = [ + ['10\x1faMachiavelli, Niccol\xe1o,\x1fd1469-1527\x1fxFiction.\x1e', '10\x1faBorgia, Cesare,\x1fd1476?-1507\x1fxFiction.\x1e'], + [' 0\x1faBorgia, Cesare, 1476?-1507\x1fxFiction.\x1e', ' 0\x1faMachiavelli, Niccolo, 1469-1527\x1fxFiction.\x1e'], + ['10\x1faMachiavelli, Niccol\xe1o,\x1fd1469-1527\x1fxFiction.\x1e', '10\x1faBorgia, Cesare,\x1fd1476?-1507\x1fxFiction.\x1e'], + ['10\x1faMachiavelli, Niccol\xe1o,\x1fd1469-1527\x1fxFiction.\x1e', '10\x1faBorgia, Cesare,\x1fd1476?-1507\x1fxFiction.\x1e'], ['10\x1faMachiavelli, Niccol\xe1o,\x1fd1469-1527\x1fxFiction.\x1e', '10\x1faBorgia, Cesare,\x1fd1476?-1507\x1fxFiction.\x1e'], ['10\x1faMachiavelli, Niccol\xe1o,\x1fd1469-1527\x1fxFiction\x1e', '10\x1faBorgia, Cesare,\x1fd1476?-1507\x1fxFiction\x1e'], + ['10\x1faMachiavelli, Niccol\xe1o,\x1fd1469-1527\x1fxFiction.\x1e', '10\x1faBorgia, Cesare,\x1fd1476?-1507\x1fxFiction.\x1e'] + ] + a, b = read_people(lines) + print(a) + assert a == {(('a', u'Borgia, Cesare'), ('d', u'1476?-1507')): 7, (('a', u'Machiavelli, Niccol\xf2'), ('d', u'1469-1527')): 7} + +def test_king_asoka(): + return + lines = [ + ['00\x1faA\xe2soka,\x1fcKing of Magadha,\x1fdfl. 259 B.C.\x1e'], + ['00\x1faA{acute}soka,\x1fcKing of Magadha\x1fdfl. 259 B.C.\x1e'], + ['00\x1faAsoka,\x1fcKing of Magadha,\x1fdfl. 259 B.C..\x1e', '30\x1faMaurya family.\x1e'], + ['04\x1faAs\xcc\x81oka,\x1fcKing of Magadha,\x1fdca. 274-232 B.C.\x1e'], + ['00\x1faA\xe2soka,\x1fcKing of Magadha,\x1fdfl. 259 B.C.\x1e', '30\x1faMaurya dynasty.\x1e'], + ['04\x1faAsoka,\x1fcKing of Magadha,\x1fdca. 274-232 B.C.\x1e'], + ['00\x1faA\xe2soka,\x1fcKing of Magadha,\x1fdfl. 259 B.C\x1e', '30\x1faMaurya dynasty\x1e'], + ['00\x1faAs\xcc\x81oka,\x1fcKing of Magadha,\x1fdfl. 259 B.C.\x1e', '30\x1faMaurya family.\x1e'] + ] + a, b = read_people(lines) + print(a) + # (('a', u'Asoka'), ('c', u'King of Magadha'), ('d', u'fl. 259 B.C..')): 1 + assert a == { + (('a', u'A\u015boka'), ('c', u'King of Magadha'), ('d', u'fl. 259 B.C.')): 7, + (('a', u'Maurya dynasty'),): 2, + (('a', u'Maurya family'),): 2, + (('a', u'Asoka'), ('c', u'King of Magadha'), ('d', u'ca. 274-232 B.C.')): 1 + } + +def test_name_lookup(): + lines = [ + ['10\x1faBellini, Giovanni,\x1fd1516.\x1e'], + ['10\x1faBellini, Giovanni,\x1fdd. 1516\x1e'] + ] + a, b = read_people(lines) + assert a == {(('a', 'Bellini, Giovanni'), ('d', 'd. 1516')): 2} + assert b == {((u'a', u'Bellini, Giovanni'), (u'd', u'1516')): ((u'a', u'Bellini, Giovanni'), (u'd', u'd. 1516'))} + +def test_cleopatra(): + return + lines = [ + ['00\x1faCleopatra,\x1fcQueen of Egypt,\x1fdd. 30 B.C\x1fxFiction.\x1e'], + ['00\x1faCleopatra,\x1fcQueen of Egypt,\x1fdd. 30 B.C.\x1fxFiction\x1e'], + [' 0\x1faCleopatra, Queen of Egypt, d. 30 B.C.\x1fxFiction.\x1e'], + ['00\x1faCleopatra,\x1fcQueen of Egypt,\x1fdd. 30 B.C.\x1fxFiction\x1e'], + ['00\x1faCleopatra,\x1fcqueen of Egypt,\x1fdd. B.C. 30\x1fxFiction\x1e'], + ['00\x1faCleopatra,\x1fcQueen of Egypt,\x1fdd. 
30 B.C.\x1fxFiction\x1e'], + ['00\x1faCleopatra,\x1fcQueen of Egypt,\x1fdd. 30 B.C.\x1fvFiction.\x1e'], + ['00\x1faCleopatra,\x1fcQueen of Egypt,\x1fdd. 30 B.C.\x1fxFiction.\x1e'] + ] + a, b = read_people(lines) + assert a == { + (('a', u'Cleopatra'), ('c', u'Queen of Egypt'), ('d', u'd. 30 B.C.')): 8, + } + +def test_date_field_missing(): + lines = [[' 0\x1faMoore, Henry Spencer, 1898-\x1e']] + a, b = read_people(lines) + assert a == { + (('a', u'Moore, Henry Spencer'), ('d', u'1898-')): 1 + } + assert b == {} + +def test_numbers_in_name(): + lines = [ + [' 0\x1faFielding, Henry, 1707-1754. The history of the adventures of Joseph Andrews.\x1e'], + ['14\x1faFielding, Henry,\x1fd1707-1754.\x1ftJoseph Andrews.\x1e'], + ['10\x1faFielding, Henry,\x1fd1707-1754.\x1ftHistory of the adventures of Joseph Andrews.\x1e'], + ['14\x1faFielding, Henry,\x1fd1707-1754.\x1ftJoseph Andrews.\x1e'], + ['10\x1faFielding, Henry,\x1fd1707-1754.\x1ftHistory of the adventures of Joseph Andrews.\x1e'], + ['10\x1faFielding, Henry,\x1fd1707-1754.\x1ftHistory of the adventures of Joseph Andrews.\x1e'], + ['10\x1faFielding, Henry,\x1fd1707-1754.\x1ftHistory of the adventures of Joseph Andrews\x1e'] + ] + a, b = read_people(lines) + assert a == { + (('a', u'Fielding, Henry'), ('d', u'1707-1754')): 7 + } + +def test_caesar(): + lines = [ + ['10\x1faCaesar, Julius.\x1e'], + ['14\x1faCaesar, Julius,\x1fd100 B.C.-44B.C.\x1e'], + ['14\x1faCaesar, Julius,\x1fd100 B.C.-44 B.C.\x1e'], + ['10\x1faCaesar, Julius\x1e'], + ['14\x1faCaesar, Julius,\x1fd100 B.C.-44 B.C.\x1e'] + ] + a, b = read_people(lines) + assert a == {(('a', 'Caesar, Julius'), ('d', '100 B.C.-44 B.C.')): 5} + +def test_salvador_dali(): + lines = [ + ['14\x1faDali\xcc\x81, Salvador,\x1fd1904-1989\x1fvCatalogs.\x1e'], + ['10\x1faDali, Salvador,\x1fd1904-\x1e'], + ['10\x1faDal\xe2i, Salvador,\x1fd1904-\x1e'], + ['10\x1faDal\xe2i, Salvador,\x1fd1904-\x1e'], + ['10\x1faDal\xe2i, Salvador,\x1fd1904-\x1fxCatalogs.\x1e', '10\x1faMorse, Albert Reynolds,\x1fd1914-\x1fxArt collections\x1fxCatalogs.\x1e'], + ['10\x1faDal\xe2i, Salvador\x1fy1904-\x1e'], + ['14\x1faDali\xcc\x81, Salvador,\x1fd1904- \x1fvexhibitions.\x1e'], + ['14\x1faDali\xcc\x81, Salvador,\x1fd1904- \x1fvexhibitions.\x1e'] + ] + a, b = read_people(lines) + assert a == { + ((u'a', u'Dal\xed, Salvador'), (u'd', u'1904-1989')): 8, + ((u'a', u'Morse, Albert Reynolds'), (u'd', u'1914-')): 1 + } + +def test_date_in_y(): + lines = [ + ['10\x1faShakespeare, William,\x1fd1564-1616\x1fxStage history\x1fy1800-1950.\x1e'], + ['10\x1faShakespeare, William,\x1fd1564-1616\x1fxStage history\x1fy1800-\x1e'], + ['10\x1faShakespeare, William,\x1fd1564-1616.\x1e'], + ['10\x1faShakespeare, William,\x1fd1564-1616\x1fxDramatic production\x1e'] + ] + a, b = read_people(lines) + assert a == {((u'a', u'Shakespeare, William'), (u'd', u'1564-1616')): 4} + +def test_subtags_swapped(): + lines = [ + ['20\x1faCompton-Burnett, I.\x1fq(Ivy),\x1fd1884-1969.\x1e'], + ['10\x1faCompton-Burnett, I.\x1fd(Ivy),\x1fq1884-1969\x1fxCriticism and interpretation.\x1e'], + ['20\x1faCompton-Burnett, I.\x1fq(Ivy),\x1fd1884-1969.\x1e'], + ['14\x1faCompton-Burnett, I.\x1fq(Ivy),\x1fd1884-1969.\x1e'], + ['20\x1faCompton-Burnett, I.\x1fq(Ivy),\x1fd1884-1969\x1fxCriticism and interpretation.\x1e'], + ['20\x1faCompton-Burnett, I.\x1fq(Ivy),\x1fd1884-1969\x1fxCriticism and interpretation.\x1e'], + ['20\x1faCompton-Burnett, I.\x1fq(Ivy),\x1fd1884-1969\x1fxCriticism and interpretation.\x1e'], + ['14\x1faCompton-Burnett, I.\x1fq(Ivy),\x1fd1884-1969.\x1e'] + ] + a, 
b = read_people(lines) + assert a == {((u'a', u'Compton-Burnett, I.'), (u'q', u'(Ivy),'), (u'd', u'1884-1969')): 8} + +def test(): + lines = [ + [ + '10\x1faWashington, George,\x1fd1732-1799\x1fxFamily\x1fvJuvenile fiction.\x1e', + '10\x1faJudge, Oney\x1fvJuvenile fiction.\x1e', + '11\x1faWashington, George,\x1fd1732-1799\x1fxFamily\x1fxFiction.\x1e', + '11\x1faJudge, Oney\x1fvFiction.\x1e' + ], [ + '10\x1faJudge, Oney\x1fvJuvenile fiction.\x1e', + '10\x1faWashington, George,\x1fd1732-1799\x1fxFamily\x1fvJuvenile fiction.\x1e', + '11\x1faJudge, Oney\x1fvFiction.\x1e', + '11\x1faWashington, George,\x1fc1732-1799\x1fxFamily\x1fvFiction.\x1e' + ] + ] + + a, b = read_people(lines) + assert a == {((u'a', u'Judge, Oney'),): 4, ((u'a', u'Washington, George'), (u'd', u'1732-1799')): 4} + +# lines = [ +# [' 0\x1faHadrian, Emperor of Rome, 76-138\x1fxFiction.\x1e'], +# ['00\x1faHadrianus,\x1fcEmperor of Rome,\x1fd76-138\x1fxFiction.\x1e'] +# ] +# lines = [[' 0\x1faGreene, Graham, 1904- . The basement room. 1971.\x1e']] + +# lines = [ +# [' 0\x1faGyllembourg-Ehrensvard, Thomasine Christine Buntzen, 1773-1856. To tidsaldre.\x1e'], +# ['10\x1faGyllembourg, Thomasine,\x1fd1773-1856.\x1ftTo tidsaldre.\x1e'], +# ['14\x1faGyllembourg-Ehrensva\xcc\x88rd, Thomasine.\x1ftTo tidsaldre.\x1e'] +# ] + +# lines = [['10\x1faClifford, Henry de Clifford, 14th lord,\x1fd1455?-1523\x1fxFiction.\x1e',]] + +def test_same_name_different_dates(): + lines = [ + ['10\x1faStrauss, Johann,\x1fd1825-1899.\x1e', '10\x1faStrauss, Johann,\x1fd1804-1849.\x1e'], + ['10\x1faStrauss, Johann,\x1fd1825-1899.\x1e', '10\x1faStrauss, Johann,\x1fd1804-1849.\x1e'], + ['10\x1faStrauss, Johann,\x1fd1825-1899.\x1e', '10\x1faStrauss, Johann,\x1fd1804-1849.\x1e'] + ] + a, b = read_people(lines) + assert a == { + ((u'a', u'Strauss, Johann'), (u'd', u'1804-1849')): 3, + ((u'a', u'Strauss, Johann'), (u'd', u'1825-1899')): 3 + } + +def test_king_richard_iii(): + lines = [ + ['00\x1faRichard\x1fbIII,\x1fcKing of England,\x1fd1452-1485\x1fvDrama.\x1e'], + ['00\x1faRichard\x1fbIII,\x1fcKing of England,\x1fd1425-1485\x1fvDrama.\x1e'], + ['00\x1faRichard\x1fbIII,\x1fcKing of England,\x1fd1452-1485\x1fvDrama.\x1e'], + ['00\x1faRichard\x1fbIII,\x1fcKing of England,\x1fd1452-1485\x1fvDrama.\x1e'], + ['00\x1faRichard\x1fbIII,\x1fcKing of England,\x1fd1452-1485\x1fvDrama.\x1e'], + ['10\x1faShakespeare, William,\x1fd1564-1616.\x1ftKing Richard III.\x1e', '00\x1faRichard\x1fbIII,\x1fcKing of England,\x1fd1452-1485\x1fvDrama.\x1e'], + ['00\x1faRichard\x1fbIII,\x1fcKing of England,\x1fd1452-1485\x1fxDrama\x1e'], + ['00\x1faRichard\x1fbIII,\x1fcKing of England,\x1fd1452-1485\x1fvDrama.\x1e'], + ['00\x1faRichard\x1fbIII,\x1fcKing of England,\x1fd1452-1485\x1fxDrama\x1e'], + ['04\x1faRichard\x1fbIII,\x1fcKing of England\x1fxDrama.\x1e'], + ['00\x1faRichard\x1fbIII,\x1fcKing of England,\x1fd1452-1485\x1fxDrama.\x1e'], + ['00\x1faRichard\x1fbIII,\x1fcKing of England,\x1fd1452-1485\x1fxDrama\x1e'], + ['10\x1faRichard\x1fbIII,\x1fcKing of England,\x1fd1452-1485\x1fxDrama.\x1e'], + ['00\x1faRichard\x1fbIII,\x1fcKing of England,\x1fd1452-1485\x1fvDrama.\x1e'] + ] + a, b = read_people(lines) + assert a == { + ((u'a', u'Richard'), (u'b', u'III'), (u'c', u'King of England'), (u'd', u'1452-1485')): 14, + ((u'a', u'Shakespeare, William'), (u'd', u'1564-1616')): 1 + } + +def test_churchill_family(): + lines = [ + ['30\x1faChurchill family\x1e'], + ['30\x1faChurchill family.\x1e'], + ['34\x1faChurchill,\x1fcfamily.\x1e'], + ['30\x1faChurchill family\x1e'], + 
['34\x1faChurchill,\x1fcFamily.\x1e'] + ] + a, b = read_people(lines) + assert a == { (('a', 'Churchill family'),): 5} + +def test_william_thompson(): + lines = [ + ['10\x1faHodgskin, Thomas,\x1fd1787-1869.\x1e', '10\x1faThompson, William,\x1fd1785?-1833.\x1e'], + ['10\x1faHodgskin, Thomas,\x1fd1787-1869.\x1e', '10\x1faThompson, William,\x1fd1775-1833.\x1e'], + ['10\x1faHodgskin, Thomas,\x1fd1787-1869.\x1e', '10\x1faThompson, William,\x1fd1775-1833.\x1e'] + ] + a, b = read_people(lines) + assert a == { # better if we could merge the William Thompson subjects + ((u'a', u'Hodgskin, Thomas'), (u'd', u'1787-1869')): 3, + ((u'a', u'Thompson, William'), (u'd', u'1775-1833')): 2, + ((u'a', u'Thompson, William'), (u'd', u'1785?-1833')): 1 + } + +def test_marcus_porcius(): + lines = [ + ['10\x1faCato, Marcus Porcius,\x1fd95-46 B.C.\x1fxDrama.\x1e'], + ['10\x1faCato, Marcus Porcius,\x1fd95-46 B.C.\x1fxDrama\x1e'], + ['10\x1faCato, Marcus Porcius,\x1fd95-46 B.C.\x1fxDrama.\x1e'], + ['10\x1faCato, Marcus Porcius,\x1fd95-46 B.C.\x1fxDrama.\x1e'], + ['10\x1faCato, Marcus Porcius,\x1fd95-46 B.C.\x1fvDrama.\x1e'], + ['10\x1faCato, Marcus Porcius,\x1fd234-149 B.C.\x1fvDrama.\x1e'], + ['10\x1faCato, Marcus Porcius,\x1fd95-46 B.C.\x1fxDrama\x1fxEarly works to 1800\x1e'] + ] + a, b = read_people(lines) + assert a == { + ((u'a', u'Cato, Marcus Porcius'), (u'd', u'234-149 B.C.')): 1, + ((u'a', u'Cato, Marcus Porcius'), (u'd', u'95-46 B.C.')): 6 + } diff --git a/ia-legacy-importer/read_rc.py b/ia-legacy-importer/read_rc.py new file mode 100644 index 00000000..14e69bb8 --- /dev/null +++ b/ia-legacy-importer/read_rc.py @@ -0,0 +1,16 @@ +import os.path + +# ~/.olrc looks like this: +# +# db='' +# user='' +# pw= '' +# host = '' +# secret_key = '' + +def read_rc(): + rc_file = os.path.expanduser('~/.olrc') + if not os.path.exists(rc_file): + return {} + f = open(rc_file) + return eval('dict(' + ', '.join(i for i in f if i) + ')') diff --git a/ia-legacy-importer/scratch/add_source_records.py b/ia-legacy-importer/scratch/add_source_records.py new file mode 100644 index 00000000..667be4dd --- /dev/null +++ b/ia-legacy-importer/scratch/add_source_records.py @@ -0,0 +1,41 @@ +from __future__ import print_function +import os +import re +import sys +import codecs +from openlibrary.catalog.read_rc import read_rc +from openlibrary.catalog.importer.db_read import get_mc + +sys.path.append('/home/edward/src/olapi') +from olapi import OpenLibrary, unmarshal, marshal + +rc = read_rc() +ol = OpenLibrary("http://dev.openlibrary.org") +ol.login('EdwardBot', rc['EdwardBot']) + +test_dir = '/home/edward/ol/test_data' + +re_edition = re.compile('^/b/OL\d+M$') + +re_meta_mrc = re.compile('^([^/]*)_meta.mrc:0:\d+$') + +for f in os.listdir(test_dir): + key = f.replace('_', '/') + if not re_edition.match(key): + continue + print(key) + continue + mc = get_mc(key) + print(key, mc) + if not mc: + continue + e = ol.get(key) + if e.get('source_records', []): + continue + if mc.startswith('ia:') or mc.startswith('amazon:'): + sr = mc + else: + m = re_meta_mrc.match(mc) + sr = 'marc:' + mc if not m else 'ia:' + m.group(1) + e['source_records'] = [sr] + print(ol.save(key, e, 'add source record')) diff --git a/ia-legacy-importer/scratch/count_41.py b/ia-legacy-importer/scratch/count_41.py new file mode 100644 index 00000000..be889d67 --- /dev/null +++ b/ia-legacy-importer/scratch/count_41.py @@ -0,0 +1,85 @@ +from __future__ import print_function +import web +import os.path +from catalog.get_ia import read_marc_file +from catalog.read_rc import 
read_rc +from catalog.marc.fast_parse import get_first_tag, get_all_subfields +from catalog.utils.query import query_iter + +marc_index = web.database(dbn='postgres', db='marc_index') +marc_index.printing = False + +rc = read_rc() + +def get_keys(loc): + assert loc.startswith('marc:') + vars = {'loc': loc[5:]} + db_iter = marc_index.query('select k from machine_comment where v=$loc', vars) + mc = list(db_iter) + if mc: + return [r.k for r in mc] + iter = query_iter({'type': '/type/edition', 'source_records': loc}) + return [e['key'] for e in iter] + +def files(): + endings = ['.mrc', '.marc', '.out', '.dat', '.records.utf8'] + def good(filename): + return any(filename.endswith(e) for e in endings) + + dir = rc['marc_path'] + dir_len = len(dir) + 1 + for dirpath, dirnames, filenames in os.walk(dir): + for f in sorted(f for f in filenames if good(f)): + name = dirpath + "/" + f + yield name, name[dir_len:], os.path.getsize(name) + +def percent(a, b): + return "%.2f%%" % (float(a * 100.0) / b) + +chunk = 10000 + +books = 0 +has_041 = 0 +has_a = 0 +has_h = 0 +has_2 = 0 +i2 = 0 +i1_0 = 0 +i1_1 = 0 +for name, part, size in files(): + f = open(name) + print(part) + for pos, loc, data in read_marc_file(part, f): + if str(data)[6:8] != 'am': # only want books + continue + books += 1 + line = get_first_tag(data, set(['041'])) + if not line: + continue + has_041 += 1 + if line[0] == '0': + i1_0 += 1 + if line[0] == '1': + i1_1 += 1 + subfields = list(get_all_subfields(line)) + print(loc) + keys = get_keys(loc) + print(keys, line[0:2], subfields) + continue + if line[1] != ' ': + i2 += 1 + print('i2:', line[0:2], subfields) + if '\x1fa' in line: + has_a +=1 + else: + print('no a:', line[0:2], subfields) + if '\x1fh' in line: + has_h +=1 + if '\x1f2' in line: + has_2 +=1 + print('has 2:', line[0:2], subfields) + if has_041 % chunk == 0: + print(books, percent(has_041, books), percent(i1_0, has_041), \ + percent(i1_1, has_041), i2, percent(has_a, has_041), \ + percent(has_h, has_041), has_2) +# print total, line[0:2], list(get_all_subfields(line)) diff --git a/ia-legacy-importer/scratch/get_651.py b/ia-legacy-importer/scratch/get_651.py new file mode 100644 index 00000000..6e2275c2 --- /dev/null +++ b/ia-legacy-importer/scratch/get_651.py @@ -0,0 +1,34 @@ +from catalog.importer.db_read import get_mc, withKey +from catalog.get_ia import get_from_local +from catalog.marc.fast_parse import get_tag_lines, get_all_subfields +import sys +import web +import simplejson as json + +def get_src(key): + e = withKey(key) + if 'source_records' in e: + return e['source_records'] + src = get_mc(key) + if src: + return [src] + +def get_651(key): + found = [] + for src in get_src(key): + data = get_from_local(src) + for tag, line in get_tag_lines(data, ['651']): + found.append(list(get_all_subfields(line))) + return found + +urls = ( + '^(/b/OL\d+M)$', 'lookup' +) +app = web.application(urls, globals()) + +class lookup: + def GET(self, key): + return json.dumps(get_651(key)) + +if __name__ == "__main__": + app.run() diff --git a/ia-legacy-importer/scratch/remove_subject_period.py b/ia-legacy-importer/scratch/remove_subject_period.py new file mode 100644 index 00000000..09c583a0 --- /dev/null +++ b/ia-legacy-importer/scratch/remove_subject_period.py @@ -0,0 +1,54 @@ +from __future__ import print_function +from catalog.utils.query import query_iter, set_staging, withKey +import sys +import codecs +import re +sys.path.append('/home/edward/src/olapi') +from olapi import OpenLibrary, Reference +from catalog.read_rc import 
read_rc + +import six + + +rc = read_rc() + +sys.stdout = codecs.getwriter('utf-8')(sys.stdout) +set_staging(True) + +ol = OpenLibrary("http://dev.openlibrary.org") +ol.login('EdwardBot', rc['EdwardBot']) + +re_skip = re.compile('\b([A-Z]|Co|Dr|Jr|Capt|Mr|Mrs|Ms|Prof|Rev|Revd|Hon)\.$') + +def has_dot(s): + return s.endswith('.') and not re_skip.search(s) + +q = { 'type': '/type/edition', 'table_of_contents': None, 'subjects': None } +queue = [] +count = 0 +for e in query_iter(q): + if not e.get('subjects', None) or not any(has_dot(s) for s in e['subjects']): + continue + subjects = [s[:-1] if has_dot(s) else s for s in e['subjects']] + q = { + 'key': e['key'], + 'subjects': {'connect': 'update_list', 'value': subjects }, + } + # need to fix table_of_contents to pass validation + toc = e['table_of_contents'] + if toc and (isinstance(toc[0], six.string_types) or toc[0]['type'] == '/type/text'): + if isinstance(toc[0], six.string_types): + assert all(isinstance(i, six.string_types) for i in toc) + new_toc = [{'title': i, 'type': '/type/toc_item'} for i in toc] + else: + assert all(i['type'] == '/type/text' for i in toc) + new_toc = [{'title': i['value'], 'type': '/type/toc_item'} for i in toc] + q['table_of_contents'] = {'connect': 'update_list', 'value': new_toc } + queue.append(q) + count += 1 + if len(queue) == 100: + print(count, 'writing to db') + print(ol.write(queue, "remove trailing period from subjects")) + queue = [] + +print(ol.write(queue, "remove trailing period from subjects")) diff --git a/ia-legacy-importer/scratch/work_author_role.py b/ia-legacy-importer/scratch/work_author_role.py new file mode 100644 index 00000000..696d6851 --- /dev/null +++ b/ia-legacy-importer/scratch/work_author_role.py @@ -0,0 +1,55 @@ +from __future__ import print_function +import sys +import codecs +from openlibrary.catalog.utils.query import query_iter, set_staging, query +from openlibrary.api import OpenLibrary, Reference +from openlibrary.catalog.read_rc import read_rc +from time import sleep + +set_staging(True) +rc = read_rc() + +ol = OpenLibrary("http://dev.openlibrary.org") +ol.login('EdwardBot', rc['EdwardBot']) +sys.stdout = codecs.getwriter('utf-8')(sys.stdout) + +work_q = { + 'type': '/type/work', + 'authors': None, + 'title': None, +} + +queue = [] + +for w in query_iter(work_q): + if not w.get('authors'): + print('no authors') + continue + if any(isinstance(a, dict) and 'author' in a for a in w['authors']): + continue + print(len(queue), w['key'], w['title']) # , ol.get(w['authors'][0]['key'])['name'] + full = ol.get(w['key']) + authors = full['authors'] + assert all(isinstance(a, Reference) for a in authors) + full['authors'] = [{'author':a} for a in authors] + queue.append(full) + if len(queue) > 1000: + print('saving') + print(ol.save_many(queue, 'update format of authors in works to provide roles')) + queue = [] + print('two second pause') + sleep(2) + continue + work_e = { + 'type': '/type/edition', + 'works': w['key'], + 'by_statement': None, + } + for e in query_iter(work_e): + by = e['by_statement'] + if by: + print(' ', e['key'], by) + +print('saving') +print(ol.save_many(queue, 'update format of authors in works to provide roles')) + diff --git a/ia-legacy-importer/solr/solr.py b/ia-legacy-importer/solr/solr.py new file mode 100755 index 00000000..d2cda9f8 --- /dev/null +++ b/ia-legacy-importer/solr/solr.py @@ -0,0 +1,41 @@ +#!/usr/bin/python + +from __future__ import print_function +from time import sleep, time +import web +import subprocess +import sys +from catalog.read_rc 
import read_rc + +from six.moves import urllib + + +rc = read_rc() + +def solr_query(q, start=0, rows=None, sort_by="publicdate desc"): + q += " AND NOT collection:test_collection AND NOT collection:opensource AND NOT collection:microfilm" +# q += " AND NOT collection:test_collection AND collection:gutenberg" + url = rc['solr_url'] + "?q=%s;%s&wt=json&start=%d" % (urllib.parse.quote(q), urllib.parse.quote_plus(sort_by), start) + if rows: + url += "&rows=%d" % rows + ret = eval(urllib.request.urlopen(url).read()) + return ret['response'] + +def get_books(**args): + ret = solr_query("mediatype:texts AND format:scandata", **args) + #ret = solr_query("mediatype:texts", **args) + return [d['identifier'] for d in ret['docs']] + +if __name__ == '__main__': + rows = 1000 + out = open(sys.argv[1], 'w') + for i in range(20): + print(i) + books = list(get_books(rows=rows, start=i * rows)) + if not books: + break + for b in books: + print(b, file=out) + out.close() + + print("finished") diff --git a/ia-legacy-importer/talis/isbn_and_author_date.py b/ia-legacy-importer/talis/isbn_and_author_date.py new file mode 100644 index 00000000..de324bdb --- /dev/null +++ b/ia-legacy-importer/talis/isbn_and_author_date.py @@ -0,0 +1,67 @@ +from __future__ import print_function +# read Talis, find books with ISBN and author date, add date to author + +from catalog.read_rc import read_rc +from catalog.marc.fast_parse import * +from catalog.infostore import get_site +from catalog.merge.names import match_name +from catalog.marc.build_record import read_author_person + +import re + +site = get_site() + +re_author_date_subfield = re.compile('\x1f[az]') +re_isbn_subfield = re.compile('\x1f[az]') + +rc = read_rc() +filename = rc['marc_path'] + 'talis_openlibrary_contribution/talis-openlibrary-contribution.mrc' + +seen = set() + +def build_fields(data): + fields = {} + for tag, line in get_tag_lines(data, ['020', '100']): + if tag in fields: + return {} + fields[tag] = line + if '020' not in fields or '100' not in fields: + return {} + if fields['100'].find('\x1fd') == -1: + return {} + if not re_isbn_subfield.search(fields['020']): + return {} + return fields + +def find_authors(isbn_list, name): + edition_keys = [] + for isbn in isbn_list: + edition_keys.extend(site.things({'type': '/type/edition', 'isbn_10': isbn})) + authors = set() + for k in edition_keys: + t = site.withKey(k) + if t.authors: + authors.update(t.authors) + for a in authors: + if not match_name(a.name, name, last_name_only_ok=False): + continue + books = site.things({'type': '/type/edition', 'authors': a.key}) + print(repr(a.key, a.name, a.birth_date, a.death_date, len(books))) + +for data, length in read_file(open(filename)): + fields = build_fields(data) + if not fields: + continue + isbn_list = read_isbn(fields['020']) + if not isbn_list: + continue + + if any(isbn in seen for isbn in isbn_list): + continue + seen.update(isbn_list) + person = read_author_person(fields['100']) + print(list(get_all_subfields(fields['100']))) + print(person) + print(isbn_list) + find_authors(isbn_list, person['personal_name']) +# fields.append(tag, list(get_all_subfields(line))) diff --git a/ia-legacy-importer/title_page_img/__init__.py b/ia-legacy-importer/title_page_img/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/ia-legacy-importer/title_page_img/load.py b/ia-legacy-importer/title_page_img/load.py new file mode 100644 index 00000000..4f612da4 --- /dev/null +++ b/ia-legacy-importer/title_page_img/load.py @@ -0,0 +1,31 @@ +from 
openlibrary.catalog.read_rc import read_rc +import httplib +import json + +from six.moves import urllib + + +rc = read_rc() + +def add_cover_image(ekey, ia): + h1 = httplib.HTTPConnection('openlibrary.org') + body = json.dumps(dict(username='ImportBot', password=rc['ImportBot'])) + headers = {'Content-Type': 'application/json'} + h1.request('POST', 'http://openlibrary.org/account/login', body, headers) + + res = h1.getresponse() + + res.read() + assert res.status == 200 + cookies = res.getheader('set-cookie').split(',') + cookie = ';'.join([c.split(';')[0] for c in cookies]) + + cover_url = 'http://www.archive.org/download/' + ia + '/page/' + ia + '_preview.jpg' + body = urllib.parse.urlencode({"url": cover_url}) + assert ekey.startswith('/books/') + add_cover_url = 'http://openlibrary.org' + ekey + '/add-cover.json' + headers = {'Content-type': 'application/x-www-form-urlencoded', 'Cookie': cookie} + h1.request('POST', add_cover_url, body, headers) + res = h1.getresponse() + res.read() + return diff --git a/ia-legacy-importer/title_page_img/replace_cover_with_title.py b/ia-legacy-importer/title_page_img/replace_cover_with_title.py new file mode 100644 index 00000000..9c5b6ace --- /dev/null +++ b/ia-legacy-importer/title_page_img/replace_cover_with_title.py @@ -0,0 +1,248 @@ +from __future__ import print_function +from openlibrary.utils.ia import find_item +from openlibrary.catalog.read_rc import read_rc +from openlibrary.catalog.utils.query import query, withKey, has_cover +from subprocess import Popen, PIPE +import web +import re +import sys +import xml.etree.ElementTree as et +import xml.parsers.expat +import socket # for exceptions +import httplib +from time import sleep + +from six.moves import urllib + + +re_single_cover = re.compile('^\[(\d+)\]$') +re_remove_xmlns = re.compile(' xmlns="[^"]+"') + +fh_log = open('/1/edward/logs/covers2', 'a') + +def write_log(ol, ia, url): + print((ol, ia, url), file=fh_log) + fh_log.flush() + +def parse_scandata_xml(f): + xml = f.read() + xml = re_remove_xmlns.sub('', xml) + #tree = et.parse(f) + tree = et.fromstring(xml) + leaf = None + leafNum = None + cover = None + title = None + for e in tree.find('pageData'): + assert e.tag == 'page' + leaf = int(e.attrib['leafNum']) + if leaf > 25: # enough + break + page_type = e.findtext('pageType') + if page_type == 'Cover': + cover = leaf + elif page_type == 'Title Page' or page_type == 'Title': + title = leaf + break + return (cover, title) + +def find_title_leaf_et(ia_host, ia_path, url): + f = urllib.request.urlopen(url) + try: + return parse_scandata_xml(f) + except xml.parsers.expat.ExpatError: + print(url) + return (None, None) + +def jp2_zip_test(ia_host, ia_path, ia): + conn = httplib.HTTPConnection(ia_host) + conn.request('HEAD', ia_path + "/" + ia + "_jp2.zip") + r1 = conn.getresponse() + try: + assert r1.status in (200, 403, 404) + except AssertionError: + print(r1.status, r1.reason) + raise + return r1.status + +def scandata_url(ia_host, ia_path, item_id): + conn = httplib.HTTPConnection(ia_host) + conn.request('HEAD', ia_path + "/scandata.zip") + r = conn.getresponse() + try: + assert r.status in (200, 403, 404) + except AssertionError: + print(r.status, r.reason) + raise + if r.status == 200: + None + conn = httplib.HTTPConnection(ia_host) + path = ia_path + "/" + item_id + "_scandata.xml" + conn.request('HEAD', path) + r = conn.getresponse() + try: + assert r.status in (200, 403, 404) + except AssertionError: + print(ia_host, path) + print(r.status, r.reason) + raise + return 'http://' + 
ia_host + path if r.status == 200 else None + +def scandata_zip_test(ia_host, ia_path): + conn = httplib.HTTPConnection(ia_host) + conn.request('HEAD', ia_path + "/scandata.zip") + r1 = conn.getresponse() + try: + assert r1.status in (200, 403, 404) + except AssertionError: + print(r1.status, r1.reason) + raise + return r1.status + + + +def urlread(url): + return urllib.request.urlopen(url).read() + +def post_cover(ol, source_url): + param = urllib.parse.urlencode({'olid': ol[3:], 'source_url': source_url}) + headers = {"Content-type": "application/x-www-form-urlencoded"} + conn = httplib.HTTPConnection("covers.openlibrary.org", timeout=20) + conn.request("POST", "/b/upload", param, headers) + r1 = conn.getresponse() + print(r1.status, r1.reason) + if r1.status not in (200, 303, 500): + open('upload.html', 'w').write(r1.read()) + print(r1.getheaders()) + print(r1.msg) + sys.exit() + conn.close() + +def post(ol, ia, ia_host, ia_path, cover, title): + use_cover = False + if title is None: + if cover is None: + return + use_cover = True +# http://covers.openlibrary.org/b/query?olid=OL7232120M + if False and not use_cover: + data = urlread('http://openlibrary.org/query.json?key=/b/OL7232119M&publish_date=') + try: + ret = eval(data) + except: + print(repr(data)) + pub_date = ret[0]['publish_date'] + use_cover = pub_date.isdigit() and int(pub_date) > 1955 + leaf = cover if use_cover else title + source_url = "http://%s/GnuBook/GnuBookImages.php?zip=%s/%s_jp2.zip&file=%s_jp2/%s_%04d.jp2" % (ia_host, ia_path, ia, ia, ia, leaf) +# print leaf, source_url + query = 'https://covers.openlibrary.org/b/query?olid=' + ol[3:] + #print query + if use_cover: + print('use_cover', end=' ') + print('https://openlibrary.org' + ol) + for attempt in range(5): + if attempt > 0: + print('trying again (%d)' % attempt) + try: + ret = urlread(query).strip() + except IOError: + continue + print(ret) + if not re_single_cover.match(ret): + print("unexpected reply: '%s'" % ret) + break + try: + write_log(ol, ia, source_url) + post_cover(ol, source_url) + except socket.timeout: + print('socket timeout') + break + except httplib.BadStatusLine: + print('bad status line') + continue + break + +bad_hosts = set() + +def find_img(item_id): + e = query({'type':'/type/edition', 'source_records':'ia:' + item_id}) + if len(e) != 1: + print('no source_records:', e) + e = query({'type':'/type/edition', 'ocaid': item_id}) + if len(e) != 1: + print('no ocaid:', e) + return + ol = e[0]['key'] + (ia_host, ia_path) = find_item(item_id) + + if not ia_host: + print('no host', item_id, ia_host) + return + if ia_host in bad_hosts: + print('bad_host') + try: + url = scandata_url(ia_host, ia_path, item_id) + if not url: + return + except socket.error: + print('socket error:', ia_host) + bad_hosts.add(ia_host) + return + + try: + status = jp2_zip_test(ia_host, ia_path, item_id) + except socket.error: + print('socket error:', ia_host) + bad_hosts.add(ia_host) + return + if status in (403, 404): + print('jp2 not found:', (ol, item_id)) + return + + try: + (cover, title) = find_title_leaf_et(ia_host, ia_path, url) + except (KeyboardInterrupt, SystemExit, NameError): + raise + if not cover or not title: + return +# except: +# print 'skip error:', ol, item_id, ia_host, ia_path +# return + print((ol, item_id, ia_host, ia_path, cover, title)) + post(ol, item_id, ia_host, ia_path, cover, title) + +def has_cover_retry(key): + for attempt in range(5): + try: + return has_cover(key) + except KeyboardInterrupt: + raise + except: + pass + sleep(2) + +skip = 
True +skip = False +for line in open('/1/edward/jsondump/2009-07-29/has_ocaid'): + key = line[:-1] + if key == '/b/OL6539962M': # the end + break + if skip: + if key == '/b/OL6539962M': + skip = False + else: + continue + if not has_cover_retry(key): + print('no cover') + continue + print(key) + e = withKey(key) + if not e.get('ocaid', None): + print('no ocaid') + continue + find_img(e['ocaid'].strip()) + +fh_log.close() + +print('finished') diff --git a/ia-legacy-importer/treasury/parse.py b/ia-legacy-importer/treasury/parse.py new file mode 100644 index 00000000..cdf415ad --- /dev/null +++ b/ia-legacy-importer/treasury/parse.py @@ -0,0 +1,71 @@ +from __future__ import print_function +import re +import sys +import xml.etree.ElementTree as et +from pprint import pprint + +def parse_catrecord(catrecord): + record = {} + re_bad_tag = re.compile(r'(<[^>]*?\s[^>]*?>)') + re_white = re.compile(r'\s') + catrecord = re_bad_tag.sub(lambda m: re_white.sub('', m.group(1)), catrecord) + tree = et.fromstring(catrecord) + record = {} + for e in tree: + f = e.tag.lower() + if e.tag == 'AUTHORS': + assert f not in record + record[f] = [(a.tag.lower(), a.text) for a in e] + continue + if e.tag == 'SEGMENT': + d = dict([(a.tag.lower(), a.text) for a in e]) + record.setdefault(f, []).append(d) + continue + elif e.tag in ('SUBJ', 'COLL', 'ALTTI', 'SERIES'): + record.setdefault(f, []).append(e.text) + continue + assert len(e) == 0 + assert f not in record + record[f] = e.text + return record + +def parse_file(): + cur = '' + expect = 'start' + i = 0 + re_call = re.compile('^(.*)\r\n$') + re_itemid = re.compile('^(.*)\r\n$') + for line in open(sys.argv[1]): + i+=1 + assert expect != 'end_file' + if expect == 'start': + assert line == 'Department of Treasury\r\n' + expect = 'start_catrecord' + continue + if expect == 'start_catrecord': + if line == '\r\n': + print("skipping duplicate CATRECORD") + continue + assert line == '\r\n' + cur += line + expect = 'end_catrecord' + continue + if expect == 'end_catrecord': + if line.startswith(''): + cur += '' + yield parse_catrecord(cur) + + cur = '' + if line == '\r\n': + expect = 'end_file' + else: + assert line == '\r\n' + expect = 'start_catrecord' + continue + else: + cur += line + + assert expect == 'end_file' + +for rec in parse_file(): + pprint(rec) diff --git a/ia-legacy-importer/update_count.py b/ia-legacy-importer/update_count.py new file mode 100644 index 00000000..c36edb00 --- /dev/null +++ b/ia-legacy-importer/update_count.py @@ -0,0 +1,71 @@ +from olwrite import Infogami, add_to_database +import web +import dbhash +from read_rc import read_rc +import cjson +import re +import sys +from time import time + +def commify(n): + """ +Add commas to an integer repr(n). 
+ +>>> commify(1) +'1' +>>> commify(123) +'123' +>>> commify(1234) +'1,234' +>>> commify(1234567890) +'1,234,567,890' +>>> commify(None) +>>> +""" + if n is None: return None + r = [] + for i, c in enumerate(reversed(str(n))): + if i and (not (i % 3)): + r.insert(0, ',') + r.insert(0, c) + return ''.join(r) + +def count_books(): + rows = list(web.query("select count(*) as num from thing where type=52")) + return rows[0].num + +def count_fulltext(): + rows = list(web.query("select count(*) as num from edition_str where key_id=40")) + return commify(rows[0].num) + +def get_macro(): + rows = list(web.query("select data from data, thing where thing_id=thing.id and key='/macros/BookCount' and revision=latest_revision")) + return cjson.decode(rows[0].data)['macro']['value'] + +rc = read_rc() +web.config.db_parameters = dict(dbn='postgres', db=rc['db'], user=rc['user'], pw=rc['pw'], host=rc['host']) +web.config.db_printing = False +web.ctx.ip = '127.0.0.1' +web.load() + +book_count = count_books() +open('/home/edward/book_count', 'a').write("%d %d\n" % (time(), book_count)) + +infogami = Infogami(rc['infogami']) +infogami.login('edward', rc['edward']) + +macro = get_macro() +re_books = re.compile(r'books = "[\d,]+"') +books = commify(book_count) +macro = re_books.sub('books = "' + books + '"', macro) + +# full text count is disabled so that the number stays about 1 million +# fulltext = count_fulltext() +# re_fulltext = re.compile(r'fulltext = "[\d,]+"') +# macro = re_fulltext.sub('fulltext = "' + fulltext + '"', macro) + +q = { + 'key': '/macros/BookCount', + 'macro': { 'connect': 'update', 'type': '/type/text', 'value': macro } +} +infogami.write(q, comment='update book count') diff --git a/ia-legacy-importer/utils/__init__.py b/ia-legacy-importer/utils/__init__.py new file mode 100644 index 00000000..abba2342 --- /dev/null +++ b/ia-legacy-importer/utils/__init__.py @@ -0,0 +1,277 @@ +# -*- coding: utf-8 -*- +import re +import web +from unicodedata import normalize +import openlibrary.catalog.merge.normalize as merge + +import six + +try: + cmp = cmp # Python 2 +except NameError: + def cmp(x, y): # Python 3 + return (x > y) - (x < y) + + +re_date = map (re.compile, [ + r'(?P\d+\??)-(?P\d+\??)', + r'(?P\d+\??)-', + r'b\.? (?P(?:ca\. )?\d+\??)', + r'd\.? (?P(?:ca\. )?\d+\??)', + r'(?P.*\d+.*)-(?P.*\d+.*)', + r'^(?P[^-]*\d+[^-]+ cent\.[^-]*)$']) + +re_ad_bc = re.compile(r'\b(B\.C\.?|A\.D\.?)') +re_date_fl = re.compile('^fl[., ]') +re_number_dot = re.compile(r'\d{2,}[- ]*(\.+)$') +re_l_in_date = re.compile(r'(l\d|\dl)') +re_end_dot = re.compile(r'[^ .][^ .]\.$', re.UNICODE) +re_marc_name = re.compile('^(.*?),+ (.*)$') +re_year = re.compile(r'\b(\d{4})\b') + +re_brackets = re.compile(r'^(.+)\[.*?\]$') + + +def key_int(rec): + # extract the number from a key like /a/OL1234A + return int(web.numify(rec['key'])) + + +def author_dates_match(a, b): + """ + Checks if the years of two authors match. Only compares years, + not names or keys. Works by returning False if any year specified in one record + does not match that in the other, otherwise True. If any one author does not have + dates, it will return True. 
+ + :param dict a: Author import dict {"name": "Some One", "birth_date": "1960"} + :param dict b: Author import dict {"name": "Some One"} + :rtype: bool + """ + for k in ['birth_date', 'death_date', 'date']: + if k not in a or a[k] is None or k not in b or b[k] is None: + continue + if a[k] == b[k] or a[k].startswith(b[k]) or b[k].startswith(a[k]): + continue + m1 = re_year.search(a[k]) + if not m1: + return False + m2 = re_year.search(b[k]) + if m2 and m1.group(1) == m2.group(1): + continue + return False + return True + + +def flip_name(name): + """ + Flip author name about the comma, stripping the comma, and removing non + abbreviated end dots. Returns name with end dot stripped if no comma+space found. + The intent is to convert a Library indexed name to natural name order. + + :param str name: e.g. "Smith, John." or "Smith, J." + :rtype: str + :return: e.g. "John Smith" or "J. Smith" + """ + + m = re_end_dot.search(name) + if m: + name = name[:-1] + if name.find(', ') == -1: + return name + m = re_marc_name.match(name) + return m.group(2) + ' ' + m.group(1) + + +def remove_trailing_number_dot(date): + m = re_number_dot.search(date) + if m: + return date[:-len(m.group(1))] + else: + return date + +def remove_trailing_dot(s): + if s.endswith(" Dept."): + return s + m = re_end_dot.search(s) + if m: + s = s[:-1] + return s + +def fix_l_in_date(date): + if not 'l' in date: + return date + return re_l_in_date.sub(lambda m:m.group(1).replace('l', '1'), date) + +re_ca = re.compile('ca\.([^ ])') + +def parse_date(date): + if re_date_fl.match(date): + return {} + date = remove_trailing_number_dot(date) + date = re_ca.sub(lambda m:'ca. ' + m.group(1), date) + if date.find('-') == -1: + for r in re_date: + m = r.search(date) + if m: + return dict((k, fix_l_in_date(v)) for k, v in m.groupdict().items()) + return {} + + parts = date.split('-') + i = { 'birth_date': parts[0].strip() } + if len(parts) == 2: + parts[1] = parts[1].strip() + if parts[1]: + i['death_date'] = fix_l_in_date(parts[1]) + if not re_ad_bc.search(i['birth_date']): + m = re_ad_bc.search(i['death_date']) + if m: + i['birth_date'] += ' ' + m.group(1) + if 'birth_date' in i and 'l' in i['birth_date']: + i['birth_date'] = fix_l_in_date(i['birth_date']) + return i + +re_cent = re.compile('^[\dl][^-]+ cent\.$') + +def pick_first_date(dates): + # this is to handle this case: + # 100: $aLogan, Olive (Logan), $cSikes, $dMrs., $d1839- + # see http://archive.org/download/gettheebehindmes00logaiala/gettheebehindmes00logaiala_meta.mrc + # or http://pharosdb.us.archive.org:9090/show-marc?record=gettheebehindmes00logaiala/gettheebehindmes00logaiala_meta.mrc:0:521 + + dates = list(dates) + if len(dates) == 1 and re_cent.match(dates[0]): + return { 'date': fix_l_in_date(dates[0]) } + + for date in dates: + result = parse_date(date) + if result != {}: + return result + + return { 'date': fix_l_in_date(' '.join([remove_trailing_number_dot(d) for d in dates])) } + +def strip_accents(s): + return normalize('NFKD', six.text_type(s)).encode('ASCII', 'ignore') + +re_drop = re.compile('[?,]') + +def match_with_bad_chars(a, b): + if six.text_type(a) == six.text_type(b): + return True + a = normalize('NFKD', six.text_type(a)).lower() + b = normalize('NFKD', six.text_type(b)).lower() + if a == b: + return True + a = a.encode('ASCII', 'ignore') + b = b.encode('ASCII', 'ignore') + if a == b: + return True + def drop(s): + return re_drop.sub('', s) + return drop(a) == drop(b) + +def accent_count(s): + return len([c for c in norm(s) if ord(c) > 127]) + +def 
norm(s): + return normalize('NFC', s) if isinstance(s, six.text_type) else s + +def pick_best_name(names): + names = [norm(n) for n in names] + n1 = names[0] + assert all(match_with_bad_chars(n1, n2) for n2 in names[1:]) + names.sort(key=lambda n:accent_count(n), reverse=True) + assert '?' not in names[0] + return names[0] + +def pick_best_author(authors): + n1 = authors[0]['name'] + assert all(match_with_bad_chars(n1, a['name']) for a in authors[1:]) + authors.sort(key=lambda a:accent_count(a['name']), reverse=True) + assert '?' not in authors[0]['name'] + return authors[0] + +def tidy_isbn(input): + output = [] + for i in input: + i = i.replace('-', '') + if len(i) in (10, 13): + output.append(i) + continue + if len(i) == 20 and all(c.isdigit() for c in i): + output.extend([i[:10], i[10:]]) + continue + if len(i) == 21 and not i[10].isdigit(): + output.extend([i[:10], i[11:]]) + continue + if i.find(';') != -1: + no_semicolon = i.replace(';', '') + if len(no_semicolon) in (10, 13): + output.append(no_semicolon) + continue + split = i.split(';') + if all(len(j) in (10, 13) for j in split): + output.extend(split) + continue + output.append(i) + return output + +def strip_count(counts): + foo = {} + for i, j in counts: + foo.setdefault(i.rstrip('.').lower() if isinstance(i, six.string_types) else i, []).append((i, j)) + ret = {} + for k, v in foo.iteritems(): + m = max(v, key=lambda x: len(x[1]))[0] + bar = [] + for i, j in v: + bar.extend(j) + ret[m] = bar + return sorted(ret.iteritems(), cmp=lambda x,y: cmp(len(y[1]), len(x[1]) )) + +def fmt_author(a): + if 'birth_date' in a or 'death_date' in a: + return "%s (%s-%s)" % ( a['name'], a.get('birth_date', ''), a.get('death_date', '') ) + return a['name'] + +def get_title(e): + if e.get('title_prefix', None) is not None: + prefix = e['title_prefix'] + if prefix[-1] != ' ': + prefix += ' ' + title = prefix + e['title'] + else: + title = e['title'] + return title + + +def mk_norm(s): + """ + Normalizes titles and strips ALL spaces and small words + to aid with string comparisons of two titles. + + :param str s: A book title to normalize and strip. + :rtype: str + :return: a lowercase string with no spaces, containg the main words of the title. 
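+
+    For example (illustrative): mk_norm("The Adventures of Tom Sawyer") would give
+    roughly 'adventuresoftomsawyer' (leading article, punctuation and spaces stripped).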
+ """ + + m = re_brackets.match(s) + if m: + s = m.group(1) + norm = merge.normalize(s).strip(' ') + norm = norm.replace(' and ', ' ') + if norm.startswith('the '): + norm = norm[4:] + elif norm.startswith('a '): + norm = norm[2:] + return norm.replace(' ', '') + + +def error_mail(msg_from, msg_to, subject, body): + assert isinstance(msg_to, list) + msg = 'From: %s\nTo: %s\nSubject: %s\n\n%s' % (msg_from, ', '.join(msg_to), subject, body) + + import smtplib + server = smtplib.SMTP('mail.archive.org') + server.sendmail(msg_from, msg_to, msg) + server.quit() diff --git a/ia-legacy-importer/utils/authority.py b/ia-legacy-importer/utils/authority.py new file mode 100644 index 00000000..a0fcbee4 --- /dev/null +++ b/ia-legacy-importer/utils/authority.py @@ -0,0 +1,107 @@ +from __future__ import print_function +from mechanize import Browser +import re +import os.path +from openlibrary.catalog.read_rc import read_rc + +rc = read_rc() + +start = "http://authorities.loc.gov/cgi-bin/Pwebrecon.cgi?DB=local&PAGE=First" +def get_table_rows(fh): + cur = '' + expect = 'thesauri' + for line in fh: + if expect == 'thesauri': + if line == 'Type of Heading\n': + expect = 'headings_close_tr' + continue + if expect == 'headings_close_tr': + assert line == '\n' + expect = 'tr' + continue + if expect == 'tr': + assert line == '\n' + expect = 'center' + continue + if expect == 'center': + if line == '\n': + yield cur.decode('utf-8') + cur = '' + elif line == '\n': + yield cur.decode('utf-8') + break + else: + cur += line + continue + +re_row = re.compile('^\n(?:[^\n(\d+)\n\n\n(\d+)\n\n\n(.+)\n\n\n(.+)\n\n$') +re_no_link = re.compile('^\n\n\d+\n\n') + +def read_serp(fh): + cur_row = 0 + for row in get_table_rows(fh): + cur_row += 1 + if re_no_link.match(row): + continue + m = re_row.match(row) + if not m: + print(row) + (param, a, row_num, bib_records, heading, type_of_heading) = m.groups() + assert str(cur_row) == row_num + yield { + 'a': a, + 'bib_records': bib_records, + 'heading': heading, + 'type': type_of_heading + } + +def search(arg): + assert '/' not in arg # because we use it in a filename + cache = rc['authority_cache'] + filename = cache + '/' + arg + if os.path.exists(filename): + return [eval(i) for i in open(filename)] + br = Browser() + br.set_handle_robots(False) + br.open(start) + br.select_form(name="querybox") + br['Search_Arg'] = arg.encode('utf-8') + br['Search_Code'] = ['NHED_'] + res = br.submit() + found = list(read_serp(res)) + br.close() + out = open(filename, 'w') + for i in found: + print(i, file=out) + out.close() + return found + +def test_harold_osman_kelly(): + arg = 'Kelly, Harold Osman' + found = search(arg) + assert found[0]['heading'] == 'Kelly, Harold Osman, 1884-1955' + +def test_jesus(): + arg = 'Jesus Christ' + found = search(arg) + assert found[0]['heading'] == 'Jesus Christ' + +def test_pope_sixtus(): + arg = 'Sixtus V Pope' + found = search(arg) + assert found[0]['heading'] == 'Sixtus V, Pope, 1520-1590' + +def test_william_the_conqueror(): + arg = 'William I King of England' + found = search(arg) + assert found[0]['heading'] == 'William I, King of England, 1027 or 8-1087' + +def test_non_ascii_result(): + arg = 'Asoka King of Magadha' + found = search(arg) + assert found[0]['heading'] == u'As\u0301oka, King of Magadha, fl. 259 B.C.' + +def test_non_ascii_param(): + arg = u'A\u015boka King of Magadha' + found = search(arg) + assert found[0]['heading'] == u'As\u0301oka, King of Magadha, fl. 259 B.C.' 
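As an illustrative sketch (not part of any file in this import), the name/date helpers defined in utils/__init__.py above are typically combined like this when normalising a MARC 100 heading; the example values are made up:

    from openlibrary.catalog.utils import flip_name, pick_first_date, mk_norm

    flip_name('Twain, Mark.')                # -> 'Mark Twain'
    pick_first_date(['1835-1910.'])          # -> {'birth_date': '1835', 'death_date': '1910'}
    mk_norm('The Adventures of Tom Sawyer')  # -> roughly 'adventuresoftomsawyer'
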
diff --git a/ia-legacy-importer/utils/del.py b/ia-legacy-importer/utils/del.py new file mode 100644 index 00000000..e01bfca3 --- /dev/null +++ b/ia-legacy-importer/utils/del.py @@ -0,0 +1,25 @@ +from __future__ import print_function +from catalog.infostore import get_site +from catalog.olwrite import Infogami +from catalog.read_rc import read_rc + +rc = read_rc() +infogami = Infogami(rc['infogami']) + +site = get_site() + +# throwaway bit of code for deleting bad scan records +# BPL can't scan microtext + +keys = site.things({'type': '/type/scan_record', 'locations': '/scanning_center/MBMBN/BPL1MI', 'scan_status': 'NOT_SCANNED'}) +while keys: + for key in keys: + sr = site.withKey(key) + print(key) + q = { + 'key': key, + 'type': { 'connect': 'update', 'value': '/type/delete' }, + } + ret = infogami.write(q, comment="can't scan microtext") + assert ret['status'] == 'ok' + keys = site.things({'type': '/type/scan_record', 'locations': '/scanning_center/MBMBN/BPL1MI', 'scan_status': 'NOT_SCANNED'}) diff --git a/ia-legacy-importer/utils/edit.py b/ia-legacy-importer/utils/edit.py new file mode 100644 index 00000000..ec94e755 --- /dev/null +++ b/ia-legacy-importer/utils/edit.py @@ -0,0 +1,105 @@ +from __future__ import print_function +import re +import web +import json +from openlibrary.catalog.importer.db_read import get_mc +from openlibrary.api import unmarshal +from time import sleep + +import six +from six.moves import urllib + +re_meta_mrc = re.compile('([^/]+)_(meta|marc).(mrc|xml)') +re_skip = re.compile(r'\b([A-Z]|Co|Dr|Jr|Capt|Mr|Mrs|Ms|Prof|Rev|Revd|Hon)\.$') + +db_amazon = web.database(dbn='postgres', db='amazon') +db_amazon.printing = False + +def query_with_retry(ol, q): + for attempt in range(50): + try: + return ol.query(q) + except: + sleep(5) + print('retry attempt', attempt) + +def get_with_retry(ol, k): + for attempt in range(50): + try: + return ol.get(k) + except: + sleep(5) + print('retry attempt', attempt) + +def amazon_source_records(asin): + iter = db_amazon.select('amazon', where='asin = $asin', vars={'asin':asin}) + return ["amazon:%s:%s:%d:%d" % (asin, r.seg, r.start, r.length) for r in iter] + +def has_dot(s): + return s.endswith('.') and not re_skip.search(s) + +def fix_toc(e): + toc = e.get('table_of_contents', None) + if not toc: + return + if isinstance(toc[0], dict) and toc[0]['type'] == '/type/toc_item': + if len(toc) == 1 and 'title' not in toc[0]: + del e['table_of_contents'] # remove empty toc + return + new_toc = [{'title': six.text_type(i), 'type': '/type/toc_item'} for i in toc if i] + e['table_of_contents'] = new_toc + +def fix_subject(e): + if e.get('subjects', None) and any(has_dot(s) for s in e['subjects']): + subjects = [s[:-1] if has_dot(s) else s for s in e['subjects']] + e['subjects'] = subjects + +def undelete_author(a, ol): + key = a['key'] + assert a['type'] == '/type/delete' + url = 'http://openlibrary.org' + key + '.json?v=' + str(a['revision'] - 1) + prev = unmarshal(json.load(urllib.request.urlopen(url))) + assert prev['type'] == '/type/author' + ol.save(key, prev, 'undelete author') + +def undelete_authors(authors, ol): + for a in authors: + if a['type'] == '/type/delete': + undelete_author(a, ol) + else: + assert a['type'] == '/type/author' + +def fix_authors(e, ol): + if 'authors' not in e: + return + authors = [get_with_retry(ol, akey) for akey in e['authors']] + while any(a['type'] == '/type/redirect' for a in authors): + print('following redirects') + authors = [get_with_retry(ol, a['location']) if a['type'] == '/type/redirect' else a 
for a in authors] + e['authors'] = [{'key': a['key']} for a in authors] + undelete_authors(authors, ol) + +def fix_edition(key, e, ol): + existing = get_mc(key) + if 'source_records' not in e and existing: + amazon = 'amazon:' + if existing.startswith('ia:'): + sr = [existing] + elif existing.startswith(amazon): + sr = amazon_source_records(existing[len(amazon):]) or [existing] + else: + print('existing:', existing) + m = re_meta_mrc.search(existing) + sr = ['marc:' + existing if not m else 'ia:' + m.group(1)] + e['source_records'] = sr + if 'ocaid' in e: + ia = 'ia:' + e['ocaid'] + if 'source_records' not in e: + e['source_records'] = [ia] + elif ia not in e['source_records']: + e['source_records'].append(ia) + + fix_toc(e) + fix_subject(e) + fix_authors(e, ol) + return e diff --git a/ia-legacy-importer/utils/query.py b/ia-legacy-importer/utils/query.py new file mode 100644 index 00000000..d42f4190 --- /dev/null +++ b/ia-legacy-importer/utils/query.py @@ -0,0 +1,162 @@ +from __future__ import print_function +import web +import simplejson as json +from time import sleep +import sys + +from six.moves import urllib + + +query_host = 'openlibrary.org' + +def urlopen(url, data=None): + version = "%s.%s.%s" % sys.version_info[:3] + user_agent = 'Mozilla/5.0 (openlibrary; %s) Python/%s' % (__name__, version) + headers = { + 'User-Agent': user_agent + } + req = urllib.request.Request(url, data, headers) + return urllib.request.urlopen(req) + +def jsonload(url): + return json.load(urlopen(url)) + +def urlread(url): + return urlopen(url).read() + +def set_query_host(host): + global query_host + query_host = host + +def has_cover(key): + url = 'https://covers.openlibrary.org/' + key[1] + '/query?olid=' + key[3:] + return urlread(url).strip() != '[]' + +def has_cover_retry(key): + for attempt in range(5): + try: + return has_cover(key) + except KeyboardInterrupt: + raise + except: + pass + sleep(2) + +def base_url(): + return "http://" + query_host + +def query_url(): + return base_url() + "/query.json?query=" + +def get_all_ia(): + print('c') + q = {'source_records~': 'ia:*', 'type': '/type/edition'} + limit = 10 + q['limit'] = limit + q['offset'] = 0 + + while True: + url = base_url() + "/api/things?query=" + web.urlquote(json.dumps(q)) + ret = jsonload(url)['result'] + for i in ret: + yield i + if not ret: + return + q['offset'] += limit + +def query(q): + url = query_url() + urllib.parse.quote(json.dumps(q)) + ret = None + for i in range(20): + try: + ret = urlread(url) + while ret.startswith('canceling statement due to statement timeout'): + ret = urlread(url) + if not ret: + print('ret == None') + except IOError: + pass + if ret: + try: + data = json.loads(ret) + if isinstance(data, dict): + if 'error' in data: + print('error:') + print(ret) + assert 'error' not in data + return data + except: + print(ret) + print(url) + sleep(20) + +def query_iter(q, limit=500, offset=0): + q['limit'] = limit + q['offset'] = offset + while True: + ret = query(q) + if not ret: + return + for i in ret: + yield i + # We haven't got as many we have requested. 
No point making one more request + if len(ret) < limit: + break + q['offset'] += limit + +def get_editions_with_covers_by_author(author, count): + q = {'type': '/type/edition', 'title_prefix': None, 'subtitle': None, 'title': None, 'authors': author} + with_covers = [] + for e in query_iter(q, limit=count): + if not has_cover(e['key']): + continue + with_covers.append(e) + if len(with_covers) == count: + return with_covers + return with_covers + +def version_iter(q, limit=500, offset=0): + q['limit'] = limit + q['offset'] = offset + while True: + url = base_url() + '/version' + v = jsonload(url) + if not v: + return + for i in query(q): + yield i + q['offset'] += limit + +def withKey(key): + url = base_url() + key + '.json' + for i in range(20): + try: + return jsonload(url) + except: + pass + print('retry:', i) + print(url) + +def get_marc_src(e): + mc = get_mc(e['key']) + if mc: + yield mc + if not e.get('source_records', []): + return + for src in e['source_records']: + if src.startswith('marc:') and src != 'marc:' + mc: + yield src[5:] + +def get_mc(key): # get machine comment + v = jsonload(base_url() + key + '.json?m=history') + + comments = [i['machine_comment'] for i in v if i.get('machine_comment', None) and ':' in i['machine_comment']] + if len(comments) == 0: + return None + if len(set(comments)) != 1: + print(key) + print(comments) + assert len(set(comments)) == 1 + if comments[0] == 'initial import': + return None + return comments[0] diff --git a/ia-legacy-importer/wikipedia/__init__.py b/ia-legacy-importer/wikipedia/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/ia-legacy-importer/wikipedia/find_ol_authors.py b/ia-legacy-importer/wikipedia/find_ol_authors.py new file mode 100644 index 00000000..78d01bce --- /dev/null +++ b/ia-legacy-importer/wikipedia/find_ol_authors.py @@ -0,0 +1,28 @@ +from __future__ import print_function +from catalog.utils import pick_first_date +import web +import re +import sys +import codecs +sys.stdout = codecs.getwriter('utf-8')(sys.stdout) + +re_marc_name = re.compile('^(.*), (.*)$') +re_end_dot = re.compile('[^ ][^ ]\.$', re.UNICODE) + +def flip_name(name): + # strip end dots like this: "Smith, John." but not like this: "Smith, J." 
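+    # e.g. "Smith, John." -> "John Smith", but "Smith, J." -> "J. Smith" (the initial keeps its dot)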
+ m = re_end_dot.search(name) + if m: + name = name[:-1] + + m = re_marc_name.match(name) + return m.group(2) + ' ' + m.group(1) + +for wikipedia, marc in (eval(i) for i in open("matches4")): + dates = pick_first_date(v for k, v in marc if k == 'd') + name = ' '.join(v for k, v in marc if k in 'abc') + print(name) + if ', ' in name: + print(flip_name(name)) + print(dates) + diff --git a/ia-legacy-importer/wikipedia/find_people.pl b/ia-legacy-importer/wikipedia/find_people.pl new file mode 100644 index 00000000..243a7b75 --- /dev/null +++ b/ia-legacy-importer/wikipedia/find_people.pl @@ -0,0 +1,66 @@ +#!/usr/bin/perl + +use strict; +use warnings; +use lib '/home/edward/lib/perl5'; +use JSON::XS; +use Parse::MediaWikiDump; + +#my $coder = JSON::XS->new->ascii; +my $coder = JSON::XS->new->utf8; + +#binmode STDOUT, ":utf8"; + +open my $fh, "-|", "curl http://download.wikimedia.org/enwiki/20081008/enwiki-20081008-pages-articles.xml.bz2 | bzip2 -dc -" or die $!; +my $pages = Parse::MediaWikiDump::Pages->new($fh); + +sub get_template { + my ($template, $text) = @_; + $text =~ /({{\s*$template)/igc or return; + my $depth = 1; + my $infobox = $1; + while ($depth) { + unless ($text =~ /\G(.*?({{|}}))/sgc) { + return; + } + $infobox .= $1; + $2 eq '}}' and do { $depth--; next }; + $2 eq '{{' and do { $depth++; next }; + } + return $infobox; +} + +my $page; +open my $redirect, ">", 'redirects' or die; +open my $people, ">", 'people' or die; +while(defined($page = $pages->next)) { + $page->namespace and next; + if ($page->redirect) { + print $redirect $coder->encode([$page->title, $page->redirect]), "\n"; + next; + } + my $cats = $page->categories; + $cats or next; + my $text = ${$page->text}; + my $len = length($text); + my $skip = 1; + for (@$cats) { + /(writer|people|birth|death)/ or next; + $skip = 0; + last; + } + $skip and next; + my %out = ( + title => $page->title, + cats => $cats, + len => $len, + ); + for (qw(persondata defaultsort infobox lifetime)) { + my $template = get_template($_, $text); + $template and $out{$_} = $template; + } + print $people $coder->encode(\%out), "\n"; +} + +close $redirect; +close $people; diff --git a/ia-legacy-importer/wikipedia/lookup.py b/ia-legacy-importer/wikipedia/lookup.py new file mode 100644 index 00000000..7407d261 --- /dev/null +++ b/ia-legacy-importer/wikipedia/lookup.py @@ -0,0 +1,521 @@ +from __future__ import print_function +import web +import re +import codecs +import sys +from time import time +from catalog.marc.fast_parse import get_subfields, get_all_subfields, get_subfield_values +from catalog.utils import pick_first_date +from unicodedata import normalize +from pprint import pprint + +sys.stdout = codecs.getwriter('utf-8')(sys.stdout) + +# bad cats: +# ... animal births +# ... animal deaths +# ... peoples + +db = web.database(dbn='postgres', db='wiki_people') +db.printing = False + +re_comma = re.compile(', *') + +re_marc_name = re.compile('^(.*), (.*)$') + +def flip_name(name): + m = re_marc_name.match(name) + if m: + return m.group(2) + ' ' + m.group(1) + return name + +re_title_of = re.compile('^(.*) (of .*)$') + +re_digit = re.compile('\d+') +re_decade = re.compile('^(\d+)s$') +re_bc_date = re.compile('^(.*) B\.C\.?$') +re_cent = re.compile('^(?:fl\.? ?)?(\d+)[a-z]{0,2}\.? cent\.$') +# fl. 13th cent/14th cent. +re_cent_range = re.compile('^(?:fl\.? ?)?(\d+)[a-z]{0,2}\.?(?: cent)?[-/](\d+)[a-z]{0,2}\.? 
cent\.$') +re_century = re.compile('^(\d+)[a-z][a-z] century$') + +def decade_match(a, start, ca): + end = start + 10 + if ca: + start -= 9 + end += 9 + if a.isdigit(): + return start <= int(a) < end + return any((start <= int(c) < end) for c in re_digit.findall(a)) + +def year_approx_match(a, b): + approx_century_match = False + if a.startswith('ca. '): + ca = True + a = a[4:] + range = 15 + else: + ca = False + range = 9 + if a == b: + return True + if a.replace('.', '') == b: + return True # ca. 440 B.C. + if a.endswith(' cent.') and b.endswith(' century') and b.startswith(a[:-1]): + return True + + bc = False + if b.endswith(' BC'): + m = re_bc_date.match(a) + if m: + a = m.group(1) + b = b[:-3] + bc = True + if approx_century_match and a.isdigit() and b.endswith(' century'): + a = int(a) + m = re_century.match(b) + assert m + cent = int(m.group(1)) + start = cent - 1 if not bc else cent + end = cent if not bc else cent + 1 + if start * 100 <= a < end * 100: + return True + + if b.isdigit(): + b = int(b) + if a.isdigit() and (bc or b < 1850) and abs(int(a) - b) <= range: + return True + if approx_century_match and a.endswith(' cent.'): + m = re_cent.match(a) + if m: + cent = int(m.group(1)) + start = cent - 1 if not bc else cent + end = cent if not bc else cent + 1 + if start * 100 <= b < end * 100: + return True + for c in re_digit.findall(a): + c = int(c) + if c == b: + return True + if (bc or b < 1850) and abs(c - b) <= range: + return True + return False + m = re_decade.match(b) + if not m: + return False + start = int(m.group(1)) + return decade_match(a, start, ca) + +def test_year_approx_match(): + assert not year_approx_match('1939', '1940') + assert year_approx_match('582', '6th century') + assert year_approx_match('13th cent.', '1240') + assert year_approx_match('ca. 360 B.C.', '365 BC') + assert year_approx_match('1889', '1890') + assert year_approx_match('1883?', '1882') + assert year_approx_match('1328?', '1320s') + assert year_approx_match('11th cent.', '11th century') + assert not year_approx_match('1330', '1320s') + assert not year_approx_match('245 B.C.', '3rd century BC') + +#test_year_approx_match() + +# fl. 13th cent/14th cent. +def cent_range(c): + m = re_cent_range.match(c) + if m: + a, b = int(m.group(1)), int(m.group(2)) + assert b == a + 1 + return ((a-1) * 100, b * 100) + m = re_cent.match(c) + assert m + a = int(m.group(1)) + return ((a-1) * 100, a * 100) + +re_fl = re.compile('^fl\.? 
?(\d+)\.?$') + +def get_birth_and_death(cats): + birth = None + death = None + for c in cats: + if c.endswith(' births'): + birth = c[:-7] + continue + elif c.endswith(' deaths'): + death = c[:-7] + continue + return birth, death + +re_century_writers_cat = re.compile('(\d+)[a-z]{2}-century.* writers') + +def date_match(dates, cats): + match_found = False + if len(dates) == 1 and 'date' in dates: + marc = dates['date'] + if marc.startswith('fl.'): + m = re_fl.match(marc) + if m: + birth, death = get_birth_and_death(cats) + if birth and death and birth.isdigit() and death.isdigit(): + return int(birth) < int(m.group(1)) < int(death) + if marc.endswith(' cent.'): + m = re_cent.match(marc) + if m: + cent = marc[:-6] + '-century' + if any(c.endswith(' writers') and cent in c for c in cats): + return True + m = re_cent_range.match(marc) + if m: + if any(cm.group(1) in m.groups() for cm in (re_century_writers_cat.match(c) for c in cats) if cm): + return True + + try: + (a, b) = cent_range(marc) + except: + print(marc) + raise + for c in cats: + for f in (' births', ' deaths'): + if not c.endswith(f): + continue + date = c[:-len(f)] + if date.isdigit(): + if a < int(date) < b: + match_found = True + else: + return False + else: + if year_approx_match(marc, date): + match_found = True + else: + return False + + return match_found + + for f in ['birth', 'death']: + if f + '_date' not in dates: + continue + marc = dates[f + '_date'] + this_cats = [i[:-(len(f)+2)] for i in cats if i.endswith(' %ss' % f)] + if not this_cats: + continue + m = any(year_approx_match(marc, i) for i in this_cats) + if m: + match_found = True + else: + return False + return match_found + +def norm_name(n): + return re_comma.sub(' ', n).lower() + +# example: "Ibn Daud, Abraham ben David," -> "Ibn Daud" +re_name_comma = re.compile('^([^, ]+ [^, ]+)?, [^ ]') + +def name_lookup(fields): + def join_fields(fields, want): + return ' '.join(v for k, v in fields if k in want) + + fields = [(k, v.lower()) for k, v in fields] + + if not any(k == 'd' for k, v in fields): + return [] + ab = [v for k, v in fields if k in 'ab'] + name = ' '.join(ab) + flipped = flip_name(name) + names = set([name, flipped]) + + a = join_fields(fields, 'a') + m = re_name_comma.match(a) + if m: + names.add(m.group(1)) + + #names = set([flipped]) + if any(k == 'c' for k, v in fields): + name = join_fields(fields, 'abc') + names.update([name, flip_name(name)]) + title = [v for k, v in fields if k in 'c'] + names.update([' '.join(title + ab), ' '.join(title + [flipped])]) + title = ' '.join(title) + names.update(["%s (%s)" % (name, title), "%s (%s)" % (flipped, title)]) + sp = title.find(' ') + if sp != -1: + m = re_title_of.search(title) + if m: + role, of_place = m.groups() + names.update([' '.join(ab + [of_place]), ' '.join([flipped, of_place])]) + names.update([' '.join([role] + ab + [of_place]), ' '.join([role, flipped, of_place])]) + + t = title[:sp] + names.update([' '.join([t] + ab), ' '.join([t, flipped])]) + if 'of st. ' in title: # for "Richard of St. 
Victor" + names.update([i.replace('of st.', 'of saint') for i in names]) + + found = [] + for n in set(re_comma.sub(' ', n) for n in names): + iter = db.query("select title, cats, name, persondata from names, people where people.id = names.person_id and name=$n", {'n':n}) + x = [(i.title, eval(i.cats), i.name, i.persondata) for i in iter if not i.title.startswith('Personal life of ')] + found += x + return found + +noble_or_clergy = ['King', 'Queen', 'Prince', 'Princess', 'Duke', 'Archduke', 'Baron', 'Pope', 'Antipope', 'Bishop', 'Archbishop'] +re_noble_or_clergy = re.compile('(' + '|'.join( noble_or_clergy ) + ')') + +def strip_brackets(line): + if line[4] == '[' and line[-2] == ']': + return line[0:4] + line[5:-2] + line[-1] + else: + return line + +def fmt_line(fields): + def bold(s): + return ''.join(i + '\b' + i for i in s) + def norm(s): + return normalize('NFC', s) + return ''.join(bold("$" + k) + norm(v) for k, v in fields) + +def pick_from_match(match): + l = [(norm_name(k), v) for k, v in match.items()] + good = [(k, v) for k, v in l if any(k == m for m in v['match_name'])] + if len(good) == 1: + return dict(good) + exact_date = [(k, v) for k, v in l if v['exact_dates']] + if len(exact_date) == 1: + return dict(exact_date) + if len(exact_date) > 1 and len(good) > 1: + exact_date = [(k, v) for k, v in good if v['exact_dates']] + if len(exact_date) == 1: + return dict(exact_date) + return match + +def more_than_one_match(match): + return [("http://en.wikipedia.org/wiki/" + name.replace(' ', '_'), i) for name, i in match.items()] + +def test_date_match(): + # $aAngelico,$cfra,$dca. 1400-l455. + dates = {'birth_date': u'ca. 1400', 'death_date': u'1455'} + cats = [u'1395 births', u'1455 deaths'] + assert date_match(dates, cats) + + # $aAndocides,$dca. 440-ca. 390 B.C. + dates = {'birth_date': u'ca. 440 B.C.', 'death_date': u'ca. 390 B.C.'} + cats = [u'440 BC births', u'390 BC deaths', u'Ancient Athenians'] + assert date_match(dates, cats) + + # $aAlexander,$cof Hales,$dca. 1185-1245. + dates = {'birth_date': u'ca. 1185', 'death_date': u'1245'} + cats = [u'13th century philosophers', u'1245 deaths', u'Roman Catholic philosophers', u'English theologians', u'Franciscans', u'Scholastic philosophers', u'People from Gloucestershire'] + assert date_match(dates, cats) + + dates = {'birth_date': u'1922'} + cats = [u'1830 births', u'1876 deaths'] + assert not date_match(dates, cats) + + dates = {'birth_date': u'1889', 'death_date': u'1947'} + cats = [u'1890 births', u'1947 deaths'] + assert date_match(dates, cats) + + dates = {'birth_date': u'1889', 'death_date': u'1947'} + cats = [u'1890 births', u'1947 deaths'] + assert date_match(dates, cats) + + dates = {} + cats = [u'1890 births', u'1947 deaths'] + assert not date_match(dates, cats) + + dates = {'birth_date': u'1883?', 'death_date': u'1963'} + cats = [u'1882 births', u'1963 deaths'] + assert date_match(dates, cats) + + dates = {'birth_date': u'1328?', 'death_date': u'1369'} + cats = [u'Karaite rabbis', u'1320s births', u'1369 deaths'] + assert date_match(dates, cats) + + dates = {'birth_date': u'ca. 1110', 'death_date': u'ca. 1180'} + cats = [u'1120s births', u'1198 deaths'] + assert date_match(dates, cats) + + # $aAbu Nuwas,$dca. 756-ca. 810. # Abu Nuwas + dates = {'birth_date': u'ca. 756', 'death_date': u'ca. 
810'} + cats = [u'750 births', u'810 deaths'] + assert date_match(dates, cats) + +date_cats = (' births', ' deaths', 'century writers', 'century Latin writers', 'century women writers', 'century French writers') # time for an regexp + +def exact_date_match(dates, cats): + if 'date' in dates or not all(i in dates for i in ('birth_date', 'death_date')): + return False + if any('ca.' in i for i in dates.values()): + return False + birth, death = get_birth_and_death(cats) + return dates['birth_date'] == birth and dates['death_date'] == death + +def look_for_match(found, dates, verbose): + match = {} + for name, cats, match_name, pd in found: + found_name_match = norm_name(name) == match_name + #seen.add(name) + if not any(any(cat.endswith(i) for i in date_cats) for cat in cats): + if False and not found_name_match: + print('name match, but no date cats') + print(name, cats, match_name) + print(dates) + print() + continue + exact_dm = exact_date_match(dates, cats) + dm = exact_dm or date_match(dates, cats) + if not dm and found_name_match: + if 'death_date' in dates: + death = dates['death_date'] + if death + ' deaths' in cats: + dm = True + elif 'birth_date' in dates: + birth = dates['birth_date'] + if birth.isdigit(): + assert birth + ' births' not in cats + if dm: + if name in match: + match[name]['match_name'].append(match_name) + else: + match[name] = {'cats': cats, 'exact_dates': exact_dm, 'match_name': [match_name]} + if not verbose: + continue + print((name, match_name)) + print("cats =", cats) + print(('match' if dm else 'no match')) + for field in ['birth', 'death']: + print(field + 's:', [i[:-(len(field)+2)] for i in cats if i.endswith(' %ss' % field)], end=' ') + print() + if verbose: + print('---') + return match + +def test_lookup(): + line = '00\x1faEgeria,\x1fd4th/5th cent.\x1e' # count=3 + wiki = 'Egeria (pilgrim)' + print(fmt_line(get_subfields(line, 'abcd'))) + fields = tuple((k, v.strip(' /,;:')) for k, v in get_subfields(line, 'abcd')) + print(fields) + found = name_lookup(fields) + print(found) + dates = pick_first_date(v for k, v in fields if k == 'd') + assert dates.items()[0] != ('date', '') + print(dates) + print() + print(look_for_match(found, dates, True)) + +#test_lookup() + +def test_lookup2(): + line = '00\x1faRichard,\x1fcof St. Victor,\x1fdd. 
1173.\x1e' + print(fmt_line(get_subfields(line, 'abcd'))) + fields = tuple((k, v.strip(' /,;:')) for k, v in get_subfields(line, 'abcd')) + print(fields) + found = name_lookup(fields) + dates = pick_first_date(v for k, v in fields if k == 'd') + assert dates.items()[0] != ('date', '') + print(dates) + print() + match = look_for_match(found, dates, False) + pprint(match) + print() + match = pick_from_match(match) + pprint(match) + +def test_lookup3(): + line = '00\x1faJohn,\x1fcof Paris,\x1fd1240?-1306.\x1e' + print(fmt_line(get_subfields(line, 'abcd'))) + fields = tuple((k, v.strip(' /,;:')) for k, v in get_subfields(line, 'abcd')) + print(fields) + found = name_lookup(fields) +# print [i for i in found if 'Paris' in i[0]] +# found = [(u'John of Paris', [u'Christian philosophers', u'Dominicans', u'Roman Catholic theologians', u'13th-century Latin writers', u'1255 births', u'1306 deaths'], u'john of paris', None)] + dates = pick_first_date(v for k, v in fields if k == 'd') + match = look_for_match(found, dates, False) + match = pick_from_match(match) + pprint(match) + +def test_lookup4(): + fields = (('a', 'Forbes, George'), ('d', '1849-1936.')) + found = name_lookup(fields) + dates = pick_first_date(v for k, v in fields if k == 'd') + match = look_for_match(found, dates, False) + for k, v in match.iteritems(): + print(k, v) + match = pick_from_match(match) + pprint(match) + +#test_lookup4() + +def db_marc_lookup(): + verbose = False + articles = set() + count = 0 + count_with_date = 0 + t0 = time() + match_count = 0 + total = 3596802 + prev_fields = None + fh = open('matches', 'w') + bad = codecs.open('more_than_one_match', 'w', 'utf8') + for line in open('/1/edward/wikipedia/marc_authors2'): + count+=1 +# (author_count, line) = eval(line) + (line, author_count) = eval(line) +# line = strip_brackets(line) + if count % 5000 == 0: + t1 = time() - t0 + rec_per_sec = count / t1 + time_left = (total - count) / rec_per_sec + #print fmt_line(get_subfields(line, 'abcd')) +# print list(get_subfields(line, 'abcd')) + print(line) + print(count, count_with_date, match_count, "%.2f%% %.2f mins left" % (float(match_count * 100.0) / float(count_with_date), time_left / 60)) + fields = tuple((k, v.strip(' /,;:')) for k, v in line) + if prev_fields == fields: + continue + prev_fields = fields + dates = pick_first_date(v for k, v in fields if k == 'd') + if dates.items()[0] == ('date', ''): + continue + count_with_date += 1 + if verbose: + print(line) + print(dates) + is_noble_or_clergy = any(k =='c' and re_noble_or_clergy.search(v) for k, v in fields) + found = name_lookup(fields) + if not found: + continue + if is_noble_or_clergy: + print('noble or clergy not found:', line) + print() + continue + match = look_for_match(found, dates, verbose) + + if not match: + continue + if is_noble_or_clergy: + print('noble or clergy not found:') + print(fmt_line(line)) + print(found) + print() + continue + match_count+=1 +# articles.add(match.keys()[0]) + if len(match) != 1: + match = pick_from_match(match) + if len(match) != 1: + print("\n" + fmt_line(line), file=bad) + for i in more_than_one_match(match): + print(i, file=bad) + else: + #print (list(get_subfields(line, 'abcd')), match.keys()[0]) + cats = match.values()[0]['cats'] + exact = match.values()[0]['exact_dates'] + dc = [i for i in cats if any(i.endswith(j) for j in date_cats)] + print((match.keys()[0], fields, author_count, dc, exact, 'Living people' in cats), file=fh) + print(match_count) + fh.close() + +if __name__ == '__main__': + db_marc_lookup() diff 
--git a/ia-legacy-importer/wikipedia/process.py b/ia-legacy-importer/wikipedia/process.py new file mode 100644 index 00000000..8a5dadf8 --- /dev/null +++ b/ia-legacy-importer/wikipedia/process.py @@ -0,0 +1,686 @@ +# coding=utf8 +from __future__ import print_function +import bz2 +import codecs +import sys +import re +import simplejson as json +from catalog.marc.fast_parse import get_subfields, get_all_subfields, get_subfield_values +from unicodedata import normalize +import MySQLdb +from catalog.utils import pick_first_date +from time import time + +re_marc_name = re.compile('^(.*), (.*)$') + +def norm(s): + return normalize('NFC', s) + +def get_conn(): + return MySQLdb.connect(passwd='', user='', use_unicode=True, charset='utf8', db='wiki_people') + +def get_cursor(): + return get_conn().cursor() + +sys.stdout = codecs.getwriter('utf8')(sys.stdout) +re_skip = re.compile('^(History|Demograph(ics|y)|Lists?) of') + +def list_names(): + for line in bz2.BZ2File('people.bz2'): + cur = json.loads(line.decode('utf8')) + title = cur['title'] + if re_skip.match(title): + continue + print(title) + +def redirects(): + titles = set([line[:-1] for line in codecs.open('people_names', 'r', 'utf8')]) + + for line in bz2.BZ2File('redirects.bz2'): + (f, t) = json.loads(line.decode('utf8')) + t = t.replace('_', ' ') + if t in titles: + print((f, t)) + +def redirect_dict(): + redirects = {} + for line in open('people_redirects'): + (f, t) = eval(line) + t = t.replace('_', ' ') + redirects.setdefault(t, []).append(f) + print(redirects) + +def add_redirects(): + redirects = eval(open('redirect_dict').read()) + for line in bz2.BZ2File('people.bz2'): + cur = json.loads(line.decode('utf8')) + title = cur['title'] + if re_skip.match(title): + continue + if title in redirects: + cur['redirects'] = redirects[title] + print(cur) + +#add_redirects() +#redirect_dict() + +re_syntax = re.compile(r'(.*?)(\||{{|}}|\[\[|\]\])', re.DOTALL) +re_html_comment = re.compile('') +re_space_or_underscore = re.compile('[ _]') +re_infobox_template = re.compile('^infobox[_ ]books?(?:\s*)?\s*', re.I) +re_persondata = re.compile('^Persondata\s*', re.I) + +re_line = re.compile('^\s*\|\s*([A-Z ]+?)\s*=\s*(.*?)\s*$') +def parse_template2(s): + fields = {} + for l in s.split('\n'): + m = re_line.match(l) + if not m: + continue + name, value = m.groups() + fields[name.strip()] = value + return fields + +def parse_template(s, expected_name): + template_depth = 1 + link_depth = 0 + pos = 2 + buf = '' + + data = [] + while template_depth > 0: + m = re_syntax.match(s[pos:]) + + pos = pos+m.end() + buf += m.group(1) + if m.group(2) == '{{': + buf += m.group(2) + template_depth += 1 + continue + + if m.group(2) == '[[': + buf += m.group(2) + link_depth += 1 + continue + + if template_depth == 1 and link_depth == 0: + data.append(buf) + buf = '' + elif m.group(2) == '|': + buf += '|' + if m.group(2) == '}}': + buf += m.group(2) + template_depth -= 1 + continue + if m.group(2) == ']]': + buf += m.group(2) + if link_depth > 0: + link_depth -= 1 + continue + assert m.group(2) == '|' + if buf != '}}': + return parse_template2(s) + assert buf == '}}' + + template_name = data.pop(0) + try: + assert template_name.lstrip().lower().startswith(expected_name.lower()) + #assert re_persondata.match(infobox_template) + #assert re_infobox_template.match(infobox_template) + except AssertionError: + print(template_name) + raise + + fields = {} + for line in data: + line = line.strip(); + if line == '' or ((line.startswith('')) or line == 'PLEASE SEE [[WP:PDATA]]!': + 
continue + if '=' in line: + name, value = line.split('=', 1) + else: + m = re_missing_equals.match(line) + if not m: + return parse_template2(s) + name, value = m.groups() + fields[name.strip()] = value.strip() + return fields + +re_missing_equals = re.compile('^([A-Z ]+) (.+)$') + +def parse_pd(pd): + lines = pd.split('\n') + print(repr(lines[-1])) + assert lines[-1] == '}}' + +def read_person_data(): + expect = set([u'DATE OF DEATH', u'NAME', u'SHORT DESCRIPTION', u'ALTERNATIVE NAMES', u'PLACE OF BIRTH', u'DATE OF BIRTH', u'PLACE OF DEATH']) + for line in open('people'): + cur = eval(line) + if 'persondata' not in cur: + continue + title = cur['title'] + if title == 'Murray Bookchin': + continue +# print 'title:', title + pd = cur['persondata'] + k = set(parse_template(pd, 'persondata').keys()) + if k > expect: + print(title) + print(k) + +def iter_people(): + return (eval(line) for line in open('people')) + +def date_cats(): + re_date_cat = re.compile('^(.*\d.*) (birth|death)s$') + cats = {'birth': {}, 'death':{}} + for cur in iter_people(): + title = cur['title'] + #print [cat for cat in cur['cats'] if cat.endswith('births') or cat.endswith('deaths')] + for cat in cur['cats']: + m = re_date_cat.match(cat) + if not m: + continue + cats[m.group(2)].setdefault(m.group(1), set()).add(title) +# print 'birth:', [(i[0], len(i[1])) for i in sorted(cats['birth'].items(), reverse = True, key = lambda i: len(i[1]))[:5]] +# print 'death:', [(i[0], len(i[1])) for i in sorted(cats['death'].items(), reverse = True, key = lambda i: len(i[1]))[:5]] + print(cats) + +#read_person_data() +#date_cats() + +def fmt_line(fields): + def bold(s): + return ''.join(i + '\b' + i for i in s) + return ''.join(bold("$" + k) + norm(v) for k, v in fields) + +def strip_brackets(line): + if line[4] == '[' and line[-2] == ']': + return line[0:4] + line[5:-2] + line[-1] + else: + return line + +def read_marc(): + for line in bz2.BZ2File('marc_authors.bz2'): + line = eval(line) + if '[Sound recording]' in line: + continue + line = strip_brackets(line) + #print expr_in_utf8(get_all_subfields(line)) + print(fmt_line(get_subfields(line, 'abcd'))) + +#read_marc() + +# 528,859 wikipedia +# 3,596,802 MARC + + +def get_names(cur): + titles = [cur['title']] + cur.get('redirects', []) + if 'persondata' in cur: + pd = parse_template(cur['persondata'], 'persondata') + if 'NAME' in pd and pd['NAME']: + titles.append(pd['NAME']) + if 'ALTERNATIVE NAMES' in pd: + alt = pd['ALTERNATIVE NAMES'] + if len(alt) > 100 and ',' in alt and ';' not in alt: + alt = alt.split(',') + else: + alt = alt.split(';') + titles += [j for j in (i.strip() for i in alt) if j] + return set(i.lower() for i in titles) + +def read_people(): + from collections import defaultdict +# wiki = [] +# title_lookup = defaultdict(list) + maximum = 0 + for cur in iter_people(): +# wiki.append(cur) + titles = [cur['title']] + cur.get('redirects', []) + if 'persondata' in cur: + pd = parse_template(cur['persondata'], 'persondata') + if 'NAME' in pd and pd['NAME']: + titles.append(pd['NAME']) + if 'ALTERNATIVE NAMES' in pd: + alt = pd['ALTERNATIVE NAMES'] + if len(alt) > 100 and ',' in alt and ';' not in alt: + alt = alt.split(',') + else: + alt = alt.split(';') + titles += [j for j in (i.strip() for i in alt) if j] + cur_max = max(len(i) for i in titles) + if cur_max > maximum: + maximum = cur_max + print(maximum) + print(cur['title']) + print(titles) +# for t in set(titles): +# title_lookup[t].append(cur) + +# filter names: Robert Bob Adam Hincmar Anselm + +# Personal life 
of Marcus Tullius Cicero + +def load_db(): + c = get_cursor() + c.execute('truncate people') + c.execute('truncate names') + c.execute('truncate redirects') + for person in iter_people(): +# print person + c.execute('insert into people (title, len, infobox, defaultsort, persondata, cats) values (%s, %s, %s, %s, %s, %s)', (person['title'], person['len'], person.get('infobox', None), person.get('defaultsort', None), person.get('persondata', None), repr(person.get('cats', [])))) + id = conn.insert_id() + c.executemany('insert ignore into names (person_id, name) values (%s, %s)', [(id, n) for n in get_names(person)]) + if 'redirects' in person: + redirects = set(r.lower() for r in person['redirects']) + c.executemany('insert ignore into redirects (person_id, redirect) values (%s, %s)', [(id, r) for r in redirects]) + +re_lifetime = re.compile('\{\{lifetime\| *(\d+s?(?: BC)?|missing|unknown|\d\d?[a-z][a-z] century)? *(?:\| *(\d+s?(?: BC)?|living|unknown|missing|\d\d?[a-z][a-z] century)? *)?(?:\|([^|]*))?\}\}', re.I) + +def load_lifetime(): + c = get_cursor() + for person in iter_people(): + if 'lifetime' not in person: + continue + m = re_lifetime.match(person['lifetime']) + if not m: + continue + (birth, death, defaultsort) = m.groups() + cats = person.get('cats', []) +# print "select id from people where title='%s'" % person['title'] + c.execute("select id from people where title=%s", (person['title'],)) + (id,) = c.fetchone() + update_cats = False + if birth and birth.lower() not in ('missing', 'unknown'): + new_cat = birth + " births" + if new_cat not in cats: + cats.append(new_cat) + update_cats = True + if death and death.lower() not in ('missing', 'unknown', 'living'): + new_cat = death + " deaths" + if new_cat not in cats: + cats.append(new_cat) + update_cats = True + if update_cats: + print(person['title']) +# print 'update people set cats=%s where id=%s' % (repr(cats), id) + c.execute('update people set cats=%s where id=%s', (repr(cats), id)) + if defaultsort: + add_to_names(c, id, defaultsort) + +re_defaultsort = re.compile('^{{defaultsort(?:key)?[;:|]\n?(.*)\n?}}$', re.I) + +re_comma = re.compile(', *') +re_comma_and_space = re.compile('[, ]+') + +def add_to_names(c, id, name): + name = re_comma.sub(' ', name).lower().strip() + c.execute('insert ignore into names (person_id, name) values (%s, %s)', (id, name)) + +def add_default_sort(): + c = get_cursor() + c.execute("select id, title, defaultsort from people where defaultsort is not null") + for id, title, ds in c.fetchall(): +# print id, ds + if title == 'Omar Gooding': + ds = '{{DEFAULTSORT:Gooding, Omar}}' + m = re_defaultsort.match(ds) + if not m: + print("http://en.wikipedia.org/wiki/" + title.replace(' ', '_')) + print(ds) + if m.group(1): + add_to_names(c, id, m.group(1)) + +re_br_or_semicolon = re.compile('(?:|;)') +re_strip = re.compile("(?:\([^)]*\)||\[\[.*?\]\]|'''?)") +re_strip2 = re.compile('(?:<.*?>|\{\{.*?\}\})') + +def add_names_from_infobox(): + c = get_cursor() + c.execute("select id, title, infobox from people where infobox is not null") + for id, title, infobox in c.fetchall(): + try: + infobox = parse_template(infobox, 'infobox') + except AttributeError: + continue + for field in 'name', 'full name': + if field not in infobox or not infobox[field]: + continue + v = re_strip.sub('', infobox[field]) +# v = infobox[field] + v = [i for i in (re_strip2.sub('', i).strip(' ,:') for i in re_br_or_semicolon.split(v)) if i] + for i in v: + i = re_comma_and_space.sub(' ', i) + if title != i: + add_to_names(c, id, i) +# 
print title, ':', field, ':', infobox[field], v + +def strip_commas_from_names(): + c = get_cursor() + c.execute("select person_id, name from names where name like '%,%'") + for id, name in c.fetchall(): + new = re_comma.sub(' ', name) + if new == ' ' or new == name: + print((id, name, new)) + assert new != ' ' and new != name + c.execute("update ignore names set name=%s where person_id=%s and name=%s", (new, id, name)) + +#read_people() + +#load_db() + +def flip_name(name): + m = re_marc_name.match(name) + if m: + return m.group(2) + ' ' + m.group(1) + return name + +re_digit = re.compile('\d+') +re_decade = re.compile('^(\d+)s$') +re_bc_date = re.compile('^(.*) B\.C\.?$') +re_cent = re.compile('^(\d+)[a-z][a-z] cent\.$') +re_century = re.compile('^(\d+)[a-z][a-z] century$') + +def decade_match(a, start): + end = start + 10 + if a.isdigit(): + return start <= int(a) < end + return any((start <= int(c) < end) for c in re_digit.findall(a)) + +def year_approx_match(a, b): + approx_century_match = False + if a.startswith('ca. '): + ca = True + a = a[4:] + range = 20 + else: + ca = False + range = 9 + if a == b: + return True + if a.replace('.', '') == b: + return True # ca. 440 B.C. + if a.endswith(' cent.') and b.endswith(' century') and b.startswith(a[:-1]): + return True + + bc = False + if b.endswith(' BC'): + m = re_bc_date.match(a) + if m: + a = m.group(1) + b = b[:-3] + bc = True + if approx_century_match and a.isdigit() and b.endswith(' century'): + a = int(a) + m = re_century.match(b) + assert m + cent = int(m.group(1)) + start = cent - 1 if not bc else cent + end = cent if not bc else cent + 1 + #print cent, start, a, end + if start * 100 <= a < end * 100: + return True + + if b.isdigit(): + b = int(b) + if a.isdigit() and (bc or b < 1850) and abs(int(a) - b) <= range: + return True + if approx_century_match and a.endswith(' cent.'): + m = re_cent.match(a) + if m: + cent = int(m.group(1)) + start = cent - 1 if not bc else cent + end = cent if not bc else cent + 1 + if start * 100 <= b < end * 100: + return True + for c in re_digit.findall(a): + c = int(c) + if c == b: + return True + if (bc or b < 1850) and abs(c - b) <= range: + return True + return False + m = re_decade.match(b) + if not m: + return False + start = int(m.group(1)) + return decade_match(a, start) + +def test_year_approx_match(): + assert not year_approx_match('1939', '1940') + assert year_approx_match('582', '6th century') + assert year_approx_match('13th cent.', '1240') + assert year_approx_match('ca. 360 B.C.', '365 BC') + assert year_approx_match('1889', '1890') + assert year_approx_match('1883?', '1882') + assert year_approx_match('1328?', '1320s') + assert year_approx_match('11th cent.', '11th century') + assert not year_approx_match('1330', '1320s') + assert not year_approx_match('245 B.C.', '3rd century BC') + +def date_match(dates, cats): + match_found = False + for f in ['birth', 'death']: + if f + '_date' not in dates: + continue + marc = dates[f + '_date'] + this_cats = [i[:-(len(f)+2)] for i in cats if i.endswith(' %ss' % f)] + if not this_cats: + continue + m = any(year_approx_match(marc, i) for i in this_cats) + #print m, marc, this_cats + if m: + match_found = True + else: + return False + return match_found + +def test_date_match(): + # $aAngelico,$cfra,$dca. 1400-l455. + dates = {'birth_date': u'ca. 1400', 'death_date': u'1455'} + cats = [u'1395 births', u'1455 deaths'] + assert date_match(dates, cats) + + # $aAndocides,$dca. 440-ca. 390 B.C. + dates = {'birth_date': u'ca. 
440 B.C.', 'death_date': u'ca. 390 B.C.'} + cats = [u'440 BC births', u'390 BC deaths', u'Ancient Athenians'] + assert date_match(dates, cats) + + # $aAlexander,$cof Hales,$dca. 1185-1245. + dates = {'birth_date': u'ca. 1185', 'death_date': u'1245'} + cats = [u'13th century philosophers', u'1245 deaths', u'Roman Catholic philosophers', u'English theologians', u'Franciscans', u'Scholastic philosophers', u'People from Gloucestershire'] + assert date_match(dates, cats) + + dates = {'birth_date': u'1922'} + cats = [u'1830 births', u'1876 deaths'] + assert not date_match(dates, cats) + + dates = {'birth_date': u'1889', 'death_date': u'1947'} + cats = [u'1890 births', u'1947 deaths'] + assert date_match(dates, cats) + + dates = {'birth_date': u'1889', 'death_date': u'1947'} + cats = [u'1890 births', u'1947 deaths'] + assert date_match(dates, cats) + + dates = {} + cats = [u'1890 births', u'1947 deaths'] + assert not date_match(dates, cats) + + dates = {'birth_date': u'1883?', 'death_date': u'1963'} + cats = [u'1882 births', u'1963 deaths'] + assert date_match(dates, cats) + + dates = {'birth_date': u'1328?', 'death_date': u'1369'} + cats = [u'Karaite rabbis', u'1320s births', u'1369 deaths'] + assert date_match(dates, cats) + + dates = {'birth_date': u'ca. 1110', 'death_date': u'ca. 1180'} + cats = [u'1120s births', u'1198 deaths'] + assert date_match(dates, cats) + + # $aAbu Nuwas,$dca. 756-ca. 810. # Abu Nuwas + dates = {'birth_date': u'ca. 756', 'death_date': u'ca. 810'} + cats = [u'750 births', u'810 deaths'] + assert date_match(dates, cats) + +re_title_of = re.compile('^(.*) (of .*)$') + +def name_lookup(c, fields): + def join_fields(fields, want): + return ' '.join(v for k, v in fields if k in want) + if not any(k == 'd' for k, v in fields): + return [] + ab = [v for k, v in fields if k in 'ab'] + name = ' '.join(ab) + flipped = flip_name(name) + names = set([name, flipped]) + #names = set([flipped]) + if any(k == 'c' for k, v in fields): + name = join_fields(fields, 'abc') + names.update([name, flip_name(name)]) + title = [v for k, v in fields if k in 'c'] + names.update([' '.join(title + ab), ' '.join(title + [flipped])]) + title = ' '.join(title) + names.update(["%s (%s)" % (name, title), "%s (%s)" % (flipped, title)]) + sp = title.find(' ') + if sp != -1: + m = re_title_of.search(title) + if m: + role, of_place = m.groups() + names.update([' '.join(ab + [of_place]), ' '.join([flipped, of_place])]) + names.update([' '.join([role] + ab + [of_place]), ' '.join([role, flipped, of_place])]) + + t = title[:sp] + names.update([' '.join([t] + ab), ' '.join([t, flipped])]) + + found = [] + for n in set(re_comma.sub(' ', n) for n in names): + c.execute("select title, cats, name, persondata from names, people where people.id = names.person_id and name=%s", (n,)) + found += c.fetchall() + return found + +# $aAleksandr Mikhaĭlovich,$cGrand Duke of Russia,$d1866-1933. 
+# == Grand Duke Alexander Mikhailovich of Russia + +def pick_from_match(match): + good = [(name, (cats, match_name)) for name, (cats, match_name) in match.items() if name.lower() == match_name] + if len(good) == 1: + return dict(good) + return match + +def more_than_one_match(match): + for name, (cats, match_name) in match.items(): + print(name, cats, match_name) + print("http://en.wikipedia.org/wiki/" + name.replace(' ', '_')) + print() + +#$aSmith, William,$d1769-1839 +#William Smith (geologist) [u'English geologists', u'Canal engineers', u'People from Oxfordshire', u'Somerset coalfield', u'1769 births', u'1839 deaths', u'People from Scarborough, North Yorkshire', u'Wollaston Medal winners'] william smith +#http://en.wikipedia.org/wiki/William_Smith_(geologist) +#William Smith (South Carolina senator) [u'1762 births', u'1840 deaths', u'United States Senators from South Carolina', u'Democratic Party (United States) vice presidential nominees', u'South Carolina lawyers'] william smith +#http://en.wikipedia.org/wiki/William_Smith_(South_Carolina_senator) + +noble_or_clergy = ['King', 'Queen', 'Prince', 'Princess', 'Duke', 'Archduke', 'Baron', 'Pope', 'Antipope', 'Bishop', 'Archbishop'] +re_noble_or_clergy = re.compile('(' + '|'.join( noble_or_clergy ) + ')') + +def db_marc_lookup(): + verbose = False + c = get_cursor() + articles = set() + count = 0 + count_with_date = 0 + t0 = time() + match_count = 0 + total = 3596802 + prev_fields = None + fh = open('matches3', 'w') + for line in bz2.BZ2File('marc_authors.bz2'): + count+=1 + line = eval(line) + line = strip_brackets(line) + if count % 5000 == 0: + t1 = time() - t0 + rec_per_sec = count / t1 + time_left = (total - count) / rec_per_sec + print(fmt_line(get_subfields(line, 'abcd'))) + print(count, count_with_date, match_count, "%.2f%% %.2f mins left" % (float(match_count * 100.0) / float(count_with_date), time_left / 60)) + fields = tuple((k, v.strip(' /,;:')) for k, v in get_subfields(line, 'abcd')) + if prev_fields == fields: + continue + prev_fields = fields + dates = pick_first_date(v for k, v in fields if k == 'd') + if dates.items()[0] == ('date', ''): + continue + count_with_date += 1 + if verbose: + print(fmt_line(get_subfields(line, 'abcd'))) + print(dates) + is_noble_or_clergy = any(re_noble_or_clergy.search(v) \ + for v in get_subfield_values(line, 'c')) + found = name_lookup(c, fields) + if not found: + continue + if is_noble_or_clergy: + print('noble or clergy not found:') + print(fmt_line(get_subfields(line, 'abcd'))) + print() + continue + match = {} + seen = set() + for name, cats, match_name, pd in found: + if name in seen: + continue + seen.add(name) + cats = eval(cats) + if not any(cat.endswith(' births') or cat.endswith(' deaths') for cat in cats): + continue + dm = date_match(dates, cats) + if dm: + match[name] = (cats, match_name) + if not verbose: + continue + print((name, match_name)) + print("cats =", cats) + print(('match' if dm else 'no match')) + for field in ['birth', 'death']: + print(field + 's:', [i[:-(len(field)+2)] for i in cats if i.endswith(' %ss' % field)], end=' ') + print() + if verbose: + print('---') + + if not match: + continue + if is_noble_or_clergy: + print('noble or clergy not found:') + print(fmt_line(get_subfields(line, 'abcd'))) + print(found) + print() + continue + match_count+=1 +# articles.add(match.keys()[0]) + if len(match) != 1: + match = pick_from_match(match) + if len(match) != 1: + print(count, match_count) + print(fmt_line(get_subfields(line, 'abcd'))) + more_than_one_match(match) 
+ else: + #print (list(get_subfields(line, 'abcd')), match.keys()[0]) + print((match.keys()[0], fields), file=fh) + continue +# print len(articles), match[0][0], fmt_line(get_subfields(line, 'abcd')) + assert len(match) == 1 + print(match_count) + fh.close() + +#add_names_from_infobox() +#test_year_approx_match() +db_marc_lookup() +#test_date_match() +#add_default_sort() +#strip_commas_from_names() + +#load_lifetime() diff --git a/ia-legacy-importer/wikipedia/read.py b/ia-legacy-importer/wikipedia/read.py new file mode 100644 index 00000000..9c7f4c47 --- /dev/null +++ b/ia-legacy-importer/wikipedia/read.py @@ -0,0 +1,40 @@ +from __future__ import print_function +import sys +import codecs +import re +from catalog.marc.fast_parse import translate +sys.stdout = codecs.getwriter('utf-8')(sys.stdout) + +prev = None +cur_marc = [] + +trans = {'&':'&','<':'<','>':'>','\n':'
    '} +re_html_replace = re.compile('([&<>\n])') + +def esc(s): + return re_html_replace.sub(lambda m: trans[m.group(1)], s) + +def esc_sp(s): + return esc(s).replace(' ', ' ') + +print('\nAuthors\n') + +print('87 authors with 10 or more variants in MARC records
    ') + +def html_subfields(marc): + return ''.join('' + k + '' + esc(translate(v)) for k, v in marc) + +for line in open("matches4"): + wiki, marc = eval(line) + if prev and prev != wiki: + if len(cur_marc) > 9: + print('

    %s

    ' % (prev.replace(" ", "_"), prev)) + print("%d variants in MARC records
    " % len(cur_marc)) + print("
      ", ''.join("
    • %s
    • \n" % html_subfields(li) for li in cur_marc), "
    ") +# for i in cur_marc: +# print ' ', i + cur_marc = [] + cur_marc.append(marc) + prev = wiki + +print('\n') diff --git a/ia-legacy-importer/wikipedia/tidy.py b/ia-legacy-importer/wikipedia/tidy.py new file mode 100644 index 00000000..e4e51b7a --- /dev/null +++ b/ia-legacy-importer/wikipedia/tidy.py @@ -0,0 +1,536 @@ +from __future__ import print_function +import bz2 +import codecs +import sys +import re +import simplejson as json +from catalog.marc.fast_parse import get_subfields, get_all_subfields, get_subfield_values +from unicodedata import normalize +import MySQLdb +from catalog.utils import pick_first_date +from time import time + +re_marc_name = re.compile('^(.*), (.*)$') + +def norm(s): + return normalize('NFC', s) + +def get_conn(): + return MySQLdb.connect(passwd='', user='', use_unicode=True, charset='utf8', db='wiki_people') + +def get_cursor(): + return get_conn().cursor() + + + +sys.stdout = codecs.getwriter('utf8')(sys.stdout) +re_skip = re.compile('^(History|Demograph(ics|y)|Lists?) of') + +def names(): + + for line in bz2.BZ2File('people.bz2'): + cur = json.loads(line.decode('utf8')) + title = cur['title'] + if re_skip.match(title): + continue + print(title) + +def redirects(): + titles = set([line[:-1] for line in codecs.open('people_names', 'r', 'utf8')]) + + for line in bz2.BZ2File('redirects.bz2'): + (f, t) = json.loads(line.decode('utf8')) + t = t.replace('_', ' ') + if t in titles: + print((f, t)) + +def redirect_dict(): + redirects = {} + for line in open('people_redirects'): + (f, t) = eval(line) + t = t.replace('_', ' ') + redirects.setdefault(t, []).append(f) + print(redirects) + +def add_redirects(): + redirects = eval(open('redirect_dict').read()) + for line in bz2.BZ2File('people.bz2'): + cur = json.loads(line.decode('utf8')) + title = cur['title'] + if re_skip.match(title): + continue + if title in redirects: + cur['redirects'] = redirects[title] + print(cur) + +#add_redirects() +#redirect_dict() + +re_syntax = re.compile(r'(.*?)(\||{{|}}|\[\[|\]\])', re.DOTALL) +re_html_comment = re.compile('') +re_space_or_underscore = re.compile('[ _]') +re_infobox_template = re.compile('^infobox[_ ]books?(?:\s*)?\s*', re.I) +re_persondata = re.compile('^Persondata\s*', re.I) + +re_line = re.compile('^\s*\|\s*([A-Z ]+?)\s*=\s*(.*?)\s*$') +def parse_template2(s): + fields = {} + for l in s.split('\n'): + m = re_line.match(l) + if not m: + continue + name, value = m.groups() + fields[name.strip()] = value + return fields + +def parse_template(s): + template_depth = 1 + link_depth = 0 + pos = 2 + buf = '' + + data = [] + while template_depth > 0: + m = re_syntax.match(s[pos:]) + + pos = pos+m.end() + buf += m.group(1) + if m.group(2) == '{{': + buf += m.group(2) + template_depth += 1 + continue + + if m.group(2) == '[[': + buf += m.group(2) + link_depth += 1 + continue + + if template_depth == 1 and link_depth == 0: + data.append(buf) + buf = '' + if m.group(2) == '}}': + buf += m.group(2) + template_depth -= 1 + continue + if m.group(2) == ']]': + buf += m.group(2) + if link_depth > 0: + link_depth -= 1 + continue + assert m.group(2) == '|' + if buf != '}}': + return parse_template2(s) + assert buf == '}}' + + infobox_template = data.pop(0) + try: + assert re_persondata.match(infobox_template) + #assert re_infobox_template.match(infobox_template) + except AssertionError: + print(infobox_template) + raise + + fields = {} + for line in data: + line = line.strip(); + if line == '' or ((line.startswith('')) or line == 'PLEASE SEE [[WP:PDATA]]!': + continue + if '=' in line: 
+ name, value = line.split('=', 1) + else: + m = re_missing_equals.match(line) + if not m: + return parse_template2(s) + name, value = m.groups() + fields[name.strip()] = value.strip() + return fields + +re_missing_equals = re.compile('^([A-Z ]+) (.+)$') + +def parse_pd(pd): + lines = pd.split('\n') + print(repr(lines[-1])) + assert lines[-1] == '}}' + +def read_person_data(): + expect = set([u'DATE OF DEATH', u'NAME', u'SHORT DESCRIPTION', u'ALTERNATIVE NAMES', u'PLACE OF BIRTH', u'DATE OF BIRTH', u'PLACE OF DEATH']) + for line in open('people'): + cur = eval(line) + if 'persondata' not in cur: + continue + title = cur['title'] + if title == 'Murray Bookchin': + continue +# print 'title:', title + pd = cur['persondata'] + k = set(parse_template(pd).keys()) + if k > expect: + print(title) + print(k) + +def iter_people(): + return (eval(line) for line in open('people')) + +def date_cats(): + re_date_cat = re.compile('^(.*\d.*) (birth|death)s$') + cats = {'birth': {}, 'death':{}} + for cur in iter_people(): + title = cur['title'] + #print [cat for cat in cur['cats'] if cat.endswith('births') or cat.endswith('deaths')] + for cat in cur['cats']: + m = re_date_cat.match(cat) + if not m: + continue + cats[m.group(2)].setdefault(m.group(1), set()).add(title) +# print 'birth:', [(i[0], len(i[1])) for i in sorted(cats['birth'].items(), reverse = True, key = lambda i: len(i[1]))[:5]] +# print 'death:', [(i[0], len(i[1])) for i in sorted(cats['death'].items(), reverse = True, key = lambda i: len(i[1]))[:5]] + print(cats) + +#read_person_data() +#date_cats() + +def fmt_line(fields): + def bold(s): + return ''.join(i + '\b' + i for i in s) + return ''.join(bold("$" + k) + norm(v) for k, v in fields) + +def strip_brackets(line): + if line[4] == '[' and line[-2] == ']': + return line[0:4] + line[5:-2] + line[-1] + else: + return line + +def read_marc(): + for line in bz2.BZ2File('marc_authors.bz2'): + line = eval(line) + if '[Sound recording]' in line: + continue + line = strip_brackets(line) + #print expr_in_utf8(get_all_subfields(line)) + print(fmt_line(get_subfields(line, 'abcd'))) + +#read_marc() + +# 528,859 wikipedia +# 3,596,802 MARC + + +def get_names(cur): + titles = [cur['title']] + cur.get('redirects', []) + if 'persondata' in cur: + pd = parse_template(cur['persondata']) + if 'NAME' in pd and pd['NAME']: + titles.append(pd['NAME']) + if 'ALTERNATIVE NAMES' in pd: + alt = pd['ALTERNATIVE NAMES'] + if len(alt) > 100 and ',' in alt and ';' not in alt: + alt = alt.split(',') + else: + alt = alt.split(';') + titles += [j for j in (i.strip() for i in alt) if j] + return set(i.lower() for i in titles) + +def read_people(): + from collections import defaultdict +# wiki = [] +# title_lookup = defaultdict(list) + maximum = 0 + for cur in iter_people(): +# wiki.append(cur) + titles = [cur['title']] + cur.get('redirects', []) + if 'persondata' in cur: + pd = parse_template(cur['persondata']) + if 'NAME' in pd and pd['NAME']: + titles.append(pd['NAME']) + if 'ALTERNATIVE NAMES' in pd: + alt = pd['ALTERNATIVE NAMES'] + if len(alt) > 100 and ',' in alt and ';' not in alt: + alt = alt.split(',') + else: + alt = alt.split(';') + titles += [j for j in (i.strip() for i in alt) if j] + cur_max = max(len(i) for i in titles) + if cur_max > maximum: + maximum = cur_max + print(maximum) + print(cur['title']) + print(titles) +# for t in set(titles): +# title_lookup[t].append(cur) + +def load_db(): + c = get_cursor() + c.execute('truncate people') + c.execute('truncate names') + c.execute('truncate redirects') + for 
person in iter_people(): +# print person + c.execute('insert into people (title, len, infobox, defaultsort, persondata, cats) values (%s, %s, %s, %s, %s, %s)', (person['title'], person['len'], person.get('infobox', None), person.get('defaultsort', None), person.get('persondata', None), repr(person.get('cats', [])))) + id = conn.insert_id() + c.executemany('insert ignore into names (person_id, name) values (%s, %s)', [(id, n) for n in get_names(person)]) + if 'redirects' in person: + redirects = set(r.lower() for r in person['redirects']) + c.executemany('insert ignore into redirects (person_id, redirect) values (%s, %s)', [(id, r) for r in redirects]) + +# print 'insert into + +#read_people() + +#load_db() + +def flip_name(name): + m = re_marc_name.match(name) + if m: + return m.group(2) + ' ' + m.group(1) + return name + +re_digit = re.compile('\d+') +re_decade = re.compile('^(\d+)s$') +re_bc_date = re.compile('^(.*) B\.C\.?$') +re_cent = re.compile('^(\d+)[a-z][a-z] cent\.$') +re_century = re.compile('^(\d+)[a-z][a-z] century$') + +def decade_match(a, start): + end = start + 10 + if a.isdigit(): + return start <= int(a) < end + return any((start <= int(c) < end) for c in re_digit.findall(a)) + +def year_approx_match(a, b): + approx_century_match = False + if a.startswith('ca. '): + ca = True + a = a[4:] + range = 20 + else: + ca = False + range = 9 + if a == b: + return True + if a.replace('.', '') == b: + return True # ca. 440 B.C. + if a.endswith(' cent.') and b.endswith(' century') and b.startswith(a[:-1]): + return True + + bc = False + if b.endswith(' BC'): + m = re_bc_date.match(a) + if m: + a = m.group(1) + b = b[:-3] + bc = True + if approx_century_match and a.isdigit() and b.endswith(' century'): + a = int(a) + m = re_century.match(b) + assert m + cent = int(m.group(1)) + start = cent - 1 if not bc else cent + end = cent if not bc else cent + 1 + #print cent, start, a, end + if start * 100 <= a < end * 100: + return True + + if b.isdigit(): + b = int(b) + if a.isdigit() and (bc or b < 1900) and abs(int(a) - b) <= range: + return True + if approx_century_match and a.endswith(' cent.'): + m = re_cent.match(a) + if m: + cent = int(m.group(1)) + start = cent - 1 if not bc else cent + end = cent if not bc else cent + 1 + if start * 100 <= b < end * 100: + return True + for c in re_digit.findall(a): + c = int(c) + if c == b: + return True + if (bc or b < 1900) and abs(c - b) <= range: + return True + return False + m = re_decade.match(b) + if not m: + return False + start = int(m.group(1)) + return decade_match(a, start) + +def test_year_approx_match(): + assert not year_approx_match('1939', '1940') + assert year_approx_match('582', '6th century') + assert year_approx_match('13th cent.', '1240') + assert year_approx_match('ca. 
360 B.C.', '365 BC') + assert year_approx_match('1889', '1890') + assert year_approx_match('1883?', '1882') + assert year_approx_match('1328?', '1320s') + assert year_approx_match('11th cent.', '11th century') + assert not year_approx_match('1330', '1320s') + assert not year_approx_match('245 B.C.', '3rd century BC') + +def date_match(dates, cats): + match_found = False + for f in ['birth', 'death']: + if f + '_date' not in dates: + continue + marc = dates[f + '_date'] + this_cats = [i[:-(len(f)+2)] for i in cats if i.endswith(' %ss' % f)] + if not this_cats: + continue + m = any(year_approx_match(marc, i) for i in this_cats) + #print m, marc, this_cats + if m: + match_found = True + else: + return False + return match_found + +def test_date_match(): + # $aAngelico,$cfra,$dca. 1400-l455. + dates = {'birth_date': u'ca. 1400', 'death_date': u'1455'} + cats = [u'1395 births', u'1455 deaths'] + assert date_match(dates, cats) + + # $aAndocides,$dca. 440-ca. 390 B.C. + dates = {'birth_date': u'ca. 440 B.C.', 'death_date': u'ca. 390 B.C.'} + cats = [u'440 BC births', u'390 BC deaths', u'Ancient Athenians'] + assert date_match(dates, cats) + + # $aAlexander,$cof Hales,$dca. 1185-1245. + dates = {'birth_date': u'ca. 1185', 'death_date': u'1245'} + cats = [u'13th century philosophers', u'1245 deaths', u'Roman Catholic philosophers', u'English theologians', u'Franciscans', u'Scholastic philosophers', u'People from Gloucestershire'] + assert date_match(dates, cats) + + dates = {'birth_date': u'1922'} + cats = [u'1830 births', u'1876 deaths'] + assert not date_match(dates, cats) + + dates = {'birth_date': u'1889', 'death_date': u'1947'} + cats = [u'1890 births', u'1947 deaths'] + assert date_match(dates, cats) + + dates = {'birth_date': u'1889', 'death_date': u'1947'} + cats = [u'1890 births', u'1947 deaths'] + assert date_match(dates, cats) + + dates = {} + cats = [u'1890 births', u'1947 deaths'] + assert not date_match(dates, cats) + + dates = {'birth_date': u'1883?', 'death_date': u'1963'} + cats = [u'1882 births', u'1963 deaths'] + assert date_match(dates, cats) + + dates = {'birth_date': u'1328?', 'death_date': u'1369'} + cats = [u'Karaite rabbis', u'1320s births', u'1369 deaths'] + assert date_match(dates, cats) + + dates = {'birth_date': u'ca. 1110', 'death_date': u'ca. 1180'} + cats = [u'1120s births', u'1198 deaths'] + assert date_match(dates, cats) + + # $aAbu Nuwas,$dca. 756-ca. 810. # Abu Nuwas + dates = {'birth_date': u'ca. 756', 'death_date': u'ca. 
810'} + cats = [u'750 births', u'810 deaths'] + assert date_match(dates, cats) + +re_title_of = re.compile(' (of .*)$') + +def name_lookup(c, fields): + def join_fields(fields, want): + return ' '.join(v for k, v in fields if k in want) + if not any(k == 'd' for k, v in fields): + return [] + ab = [v for k, v in fields if k in 'ab'] + name = ' '.join(ab) + flipped = flip_name(name) + #names.update([name, flipped]) + names = set([flipped]) + if any(k == 'c' for k, v in fields): + name = join_fields(fields, 'abc') + names.update([name, flip_name(name)]) + title = [v for k, v in fields if k in 'c'] + names.update([' '.join(title + ab), ' '.join(title + [flipped])]) + + title = ' '.join(title) + sp = title.find(' ') + if sp != -1: + m = re_title_of.search(title) + if m: + t = m.group(1) + names.update([' '.join(ab + [t]), ' '.join([flipped, t])]) + + t = title[:sp] + names.update([' '.join([t] + ab), ' '.join([t, flipped])]) + + found = [] + names.update(n.replace(',', '') for n in names.copy() if ',' in n) + for n in names: + c.execute("select title, cats, name, persondata from names, people where people.id = names.person_id and name=%s", (n,)) + found += c.fetchall() + return found + +def db_marc_lookup(): + c = get_cursor() + articles = set() + count = 0 + t0 = time() + match_count = 0 + total = 3596802 + for line in bz2.BZ2File('marc_authors.bz2'): + count+=1 + if count % 1000 == 0: + t1 = time() - t0 + rec_per_sec = count / t1 + time_left = (total - count) / rec_per_sec + print(count, match_count, "%.2f%% %.2f mins left" % ((match_count * 100) / count, time_left / 60)) + line = eval(line) + line = strip_brackets(line) + fields = [(k, v.strip(' /,;:')) for k, v in get_subfields(line, 'abcd')] + dates = pick_first_date(v for k, v in fields if k == 'd') + if dates.items()[0] == ('date', ''): + continue + found = name_lookup(c, fields) + if not found: + continue + match = {} + seen = set() +# print fmt_line(get_subfields(line, 'abcd')) +# print dates + for name, cats, match_name, pd in found: + if name in seen: + continue + seen.add(name) + cats = eval(cats) + if not any(cat.endswith(' births') or cat.endswith(' deaths') for cat in cats): + continue + dm = date_match(dates, cats) + if dm: + match[name] = (cats, match_name) + continue + print((name, match_name)) + print("cats =", cats) + print(('match' if dm else 'no match')) + for field in ['birth', 'death']: + print(field + 's:', [i[:-(len(field)+2)] for i in cats if i.endswith(' %ss' % field)], end=' ') + print() +# print '---' + + if not match: + continue + match_count+=1 +# articles.add(match.keys()[0]) + if len(match) != 1: + print(count, match_count) + print(fmt_line(get_subfields(line, 'abcd'))) + for name, (cats, match_name) in match.items(): + print(name, cats, match_name) + print("http://en.wikipedia.org/wiki/" + name.replace(' ', '_')) + print() + continue +# print len(articles), match[0][0], fmt_line(get_subfields(line, 'abcd')) + assert len(match) == 1 + print(match_count) + +#test_year_approx_match() +#db_marc_lookup() +#test_date_match() diff --git a/ia-legacy-importer/wikipedia/uniq.py b/ia-legacy-importer/wikipedia/uniq.py new file mode 100644 index 00000000..95009e6a --- /dev/null +++ b/ia-legacy-importer/wikipedia/uniq.py @@ -0,0 +1,2 @@ +from __future__ import print_function +print(len(set(eval(l)[1] for l in open('matches2')))) diff --git a/ia-legacy-importer/works/__init__.py b/ia-legacy-importer/works/__init__.py new file mode 100644 index 00000000..e69de29b diff --git a/ia-legacy-importer/works/add_fields_to_works.py 
b/ia-legacy-importer/works/add_fields_to_works.py new file mode 100755 index 00000000..b9904434 --- /dev/null +++ b/ia-legacy-importer/works/add_fields_to_works.py @@ -0,0 +1,186 @@ +#!/usr/local/bin/python2.5 +from __future__ import print_function +import sys +import re +import codecs +sys.path.append('/home/edward/src/olapi') +from olapi import OpenLibrary +import simplejson as json +from collections import defaultdict +from catalog.read_rc import read_rc +from catalog.utils.query import query, query_iter, set_staging, base_url +from catalog.utils import mk_norm, get_title +from six.moves import urllib + +import six + + +sys.stdout = codecs.getwriter('utf-8')(sys.stdout) +set_staging(True) + +rc = read_rc() + +ol = OpenLibrary(base_url()) +ol.login('EdwardBot', rc['EdwardBot']) + +re_year = re.compile('(\d{3,})$') + +queue = [] + +def iter_works(fields): + q = { 'type':'/type/work', 'key': None } + for f in fields: q[f] = None + return query_iter(q) + +def dates(): + global queue + f = 'first_publish_date' + for w in iter_works([f, 'title']): + if f in w: + continue + q = { 'type':'/type/edition', 'works': w['key'], 'publish_date': None } + years = defaultdict(list) + for e in query_iter(q): + date = e.get('publish_date', None) + if not date or date == '0000': + continue + m = re_year.match(date) + if not m: + continue + year = int(m.group(1)) + years[year].append(e['key']) + if not years: + continue + first = min(years.keys()) + assert first != 0 + print((w['key'], repr(w['title']), first)) + q = { + 'key': w['key'], + f: { 'connect': 'update', 'value': str(first)} + } + queue.append(q) + if len(queue) == 200: + print(ol.write(queue, comment='add first publish date')) + queue = [] + print(ol.write(queue, comment='add first publish date')) + +def lang(): + f = 'original_languages' + queue = [] + for w in iter_works([f, 'title']): + if f in w and w[f]: + continue + q = { + 'type':'/type/edition', + 'works': w['key'], + 'languages': None, + 'title': None, + 'title_prefix': None + } + editions = [e for e in query_iter(q) if e['languages']] + title = mk_norm(w['title']) + if not editions or any(len(e['languages']) != 1 for e in editions): + continue + lang = [e['languages'][0]['key'] for e in editions if mk_norm(get_title(e)) == title] + if len(lang) < 2: + continue + first = lang[0] + if any(l != first for l in lang): + continue + print((w['key'], repr(w['title']), first, len(lang))) + q = { + 'key': w['key'], + f: { 'connect': 'update_list', 'value': [first]} + } + queue.append(q) + if len(queue) == 200: + print(ol.write(queue, comment='add original language')) + queue = [] + print(ol.write(queue, comment='add original language')) + +def toc_items(toc_list): + return [{'title': item, 'type': '/type/toc_item'} for item in toc_list] + +def add_fields(): + comment = 'add fields to works' + queue = [] + seen = set() + fields = ['genres', 'first_sentence', 'dewey_number', \ + 'lc_classifications', 'publish_date'] #, 'table_of_contents'] + for w in iter_works(fields + ['title']): + if w['key'] in seen or all(w.get(f, None) for f in fields): + continue + seen.add(w['key']) + q = { 'type':'/type/edition', 'works': w['key']} + for f in fields: q[f] = None + editions = list(query_iter(q)) + + found = {} + + for f in fields: + if not w.get(f, None): + if f == 'publish_date': + years = defaultdict(list) + for e in editions: + date = e.get(f, None) + if not date or date == '0000': + continue + m = re_year.match(date) + if not m: + continue + year = int(m.group(1)) + years[year].append(e['key']) + if 
years: + found[f] = str(min(years.keys())) + continue + if f == 'genres': + found_list = [[g.strip('.') for g in e[f]] for e in editions \ + if e.get(f, None) and not any('translation' in i for i in e[f])] + if f == 'table_of_contents': + found_list = [] + for e in query_iter(q): + if not e.get(f, None): + continue + toc = e[f] + print(e['key'], toc) + print(e) + print() + if isinstance(toc[0], six.string_types): + found_list.append(toc_items(toc)) + else: + assert isinstance(toc[0], dict) + if toc[0]['type'] == '/type/text': + found_list.append(toc_items([i['value'] for i in toc])) + else: + assert toc[0]['type']['key'] == '/type/toc_item' + found_list.append(toc) + else: + found_list = [e[f] for e in query_iter(q) if e.get(f, None)] + if found_list: + first = found_list[0] + if all(i == first for i in found_list): + found[f] = first + + if not found: + continue + + print(len(queue) + 1, w['key'], len(editions), w['title']) + print(found) + + q = { 'key': w['key'], } + for f in fields: + if not f in found: + continue + if f == 'publish_date': + q['first_publish_date'] = { 'connect': 'update', 'value': found[f]} + elif f == 'first_sentence': + q[f] = { 'connect': 'update', 'value': found[f]} + else: + q[f] = { 'connect': 'update_list', 'value': found[f]} + queue.append(q) + if len(queue) == 200: + print(ol.write(queue, comment=comment)) + queue = [] + print(ol.write(queue, comment=comment)) + +add_fields() diff --git a/ia-legacy-importer/works/by_author.py b/ia-legacy-importer/works/by_author.py new file mode 100755 index 00000000..668d3968 --- /dev/null +++ b/ia-legacy-importer/works/by_author.py @@ -0,0 +1,284 @@ +#!/usr/local/bin/python2.5 +from __future__ import print_function +import re +import sys +import codecs +import web +from openlibrary.catalog.get_ia import get_from_archive +from openlibrary.catalog.marc.fast_parse import get_subfield_values, get_first_tag, get_tag_lines, get_subfields +from openlibrary.catalog.utils.query import query_iter, set_staging, query +from openlibrary.catalog.utils import cmp, mk_norm +from openlibrary.catalog.read_rc import read_rc +from collections import defaultdict + +from catalog.utils.edit import fix_edition +from olapi import OpenLibrary, Reference +import olapi +from six.moves import urllib + +import six + + +rc = read_rc() + +ol = OpenLibrary("http://dev.openlibrary.org") +ol.login('EdwardBot', rc['EdwardBot']) + +sys.stdout = codecs.getwriter('utf-8')(sys.stdout) +re_skip = re.compile('\b([A-Z]|Co|Dr|Jr|Capt|Mr|Mrs|Ms|Prof|Rev|Revd|Hon|etc)\.$') + +base_url = "http://dev.openlibrary.org" +query_url = base_url + "/query.json?query=" + +work_num = 184076 + +set_staging(True) + +def withKey(key): + url = base_url + key + ".json" + return urllib.request.urlopen(url).read() + +def find_new_work_key(): + global work_num + while True: + key = "/w/OL%dW" % work_num + ret = withKey(key) + if ret.startswith("Not Found:"): + return work_num + work_num += 1 + +def next_work_key(): + global work_num + key = "/w/OL%dW" % work_num + ret = withKey(key) + while not ret.startswith("Not Found:"): + work_num += 1 + key = "/w/OL%dW" % work_num + ret = withKey(key) + work_num += 1 + return key + +# sample title: The Dollar Hen (Illustrated Edition) (Dodo Press) +re_parens = re.compile('^(.*?)(?: \(.+ (?:Edition|Press)\))+$') + +def top_rev_wt(d): + d_sorted = sorted(d.keys(), cmp=lambda i, j: cmp(d[j], d[i]) or cmp(len(j), len(i))) + return d_sorted[0] + +def books_query(akey): # live version + q = { + 'type':'/type/edition', + 'authors': akey, + '*': None + } + 
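# fields set to None are returned by the query API; '*': None appears to ask for every field of each matching edition (an assumption based on how query_iter is used elsewhere in this importer)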
return query_iter(q) + +def freq_dict_top(d): + return sorted(d.keys(), reverse=True, key=lambda i:d[i])[0] + + +def get_work_title(e): + if e['key'] not in marc: + assert not e.get('work_titles', []) + return +# assert e.get('work_titles', []) + data = marc[e['key']][1] + line = get_first_tag(data, set(['240'])) + if not line: + assert not e.get('work_titles', []) + return + return ' '.join(get_subfield_values(line, ['a'])).strip('. ') + +def get_books(akey): + for e in books_query(akey): + if not e.get('title', None): + continue + if len(e.get('authors', [])) != 1: + continue +# if 'works' in e: +# continue + if 'title_prefix' in e and e['title_prefix']: + prefix = e['title_prefix'] + if prefix[-1] != ' ': + prefix += ' ' + title = prefix + e['title'] + else: + title = e['title'] + + title = title.strip(' ') + if has_dot(title): + title = title[:-1] + if title.strip('. ') in ['Publications', 'Works', 'Report', \ + 'Letters', 'Calendar', 'Bulletin', 'Plays', 'Sermons', 'Correspondence']: + continue + + m = re_parens.match(title) + if m: + title = m.group(1) + + n = mk_norm(title) + + book = { + 'title': title, + 'norm_title': n, + 'key': e['key'], + } + + if 'languages' in e: + book['lang'] = [l['key'][3:] for l in e['languages']] + + if e.get('table_of_contents', None): + if isinstance(e['table_of_contents'][0], six.string_types): + book['table_of_contents'] = e['table_of_contents'] + else: + assert isinstance(e['table_of_contents'][0], dict) + if e['table_of_contents'][0]['type'] == '/type/text': + book['table_of_contents'] = [i['value'] for i in e['table_of_contents']] + + wt = get_work_title(e) + if not wt: + yield book + continue + if wt in ('Works', 'Selections'): + yield book + continue + n_wt = mk_norm(wt) + book['work_title'] = wt + book['norm_wt'] = n_wt + yield book + +def build_work_title_map(equiv, norm_titles): + # map of book titles to work titles + title_to_work_title = defaultdict(set) + for (norm_title, norm_wt), v in equiv.items(): + if v != 1: + title_to_work_title[norm_title].add(norm_wt) + + title_map = {} + for title, v in title_to_work_title.items(): + if len(v) == 1: + title_map[title] = list(v)[0] + continue + most_common_title = max(v, key=lambda i:norm_titles[i]) + if title != most_common_title: + title_map[title] = most_common_title + for i in v: + if i != most_common_title: + title_map[i] = most_common_title + return title_map + +def find_works(akey): + equiv = defaultdict(int) # title and work title pairs + norm_titles = defaultdict(int) # frequency of titles + books_by_key = {} + books = [] + rev_wt = defaultdict(lambda: defaultdict(int)) + + for book in get_books(akey): + if 'norm_wt' in book: + pair = (book['norm_title'], book['norm_wt']) + equiv[pair] += 1 + rev_wt[book['norm_wt']][book['work_title']] +=1 + norm_titles[book['norm_title']] += 1 + books_by_key[book['key']] = book + books.append(book) + + title_map = build_work_title_map(equiv, norm_titles) + + works = defaultdict(lambda: defaultdict(list)) + work_titles = defaultdict(list) + for b in books: + if 'eng' not in b.get('lang', []) and 'norm_wt' in b: + work_titles[b['norm_wt']].append(b['key']) + continue + n = b['norm_title'] + title = b['title'] + if n in title_map: + n = title_map[n] + title = top_rev_wt(rev_wt[n]) + works[n][title].append(b['key']) + + works = sorted([(sum(map(len, w.values() + [work_titles[n]])), n, w) for n, w in works.items()]) + + for work_count, norm, w in works: + if work_count < 2: + continue + first = sorted(w.items(), reverse=True, key=lambda i:len(i[1]))[0][0] + 
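# 'first' is the title variant attached to the largest number of editions in this group; it becomes the work title when the work is yielded below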
titles = defaultdict(int) + for key_list in w.values(): + for ekey in key_list: + b = books_by_key[ekey] + title = b['title'] + titles[title] += 1 + keys = work_titles[norm] + for values in w.values(): + keys += values + assert work_count == len(keys) + title = max(titles.keys(), key=lambda i:titles[i]) + toc = [(k, books_by_key[k].get('table_of_contents', None)) for k in keys] + yield {'title': first, 'editions': keys, 'toc': dict((k, v) for k, v in toc if v)} + +def print_works(works): + for w in works: + print(len(w['editions']), w['title']) + +def toc_items(toc_list): + return [{'title': six.text_type(item), 'type': Reference('/type/toc_item')} for item in toc_list] + +def add_works(akey, works): + queue = [] + for w in works: + w['key'] = next_work_key() + q = { + 'authors': [akey], + 'create': 'unless_exists', + 'type': '/type/work', + 'key': w['key'], + 'title': w['title'] + } + #queue.append(q) + print(ol.write(q, comment='create work')) + for ekey in w['editions']: + e = ol.get(ekey) + fix_edition(ekey, e, ol) + e['works'] = [Reference(w['key'])] + try: + ol.save(ekey, e, 'found a work') + except olapi.OLError: + print(ekey) + print(e) + raise + +def by_authors(): + find_new_work_key() + + skipping = False + skipping = True + q = { 'type':'/type/author', 'name': None, 'works': None } + for a in query_iter(q, offset=215000): + akey = a['key'] + if skipping: + print('skipping:', akey, a['name']) + if akey == '/a/OL218496A': + skipping = False + continue + + q = { + 'type':'/type/work', + 'authors': akey, + } + if query(q): + print((akey, repr(a['name']), 'has works')) + continue + + # print akey, a['name'] + found = find_works(akey) + works = [i for i in found if len(i['editions']) > 2] + if works: + #open('found/' + akey[3:], 'w').write(repr(works)) + print((akey, repr(a['name']))) + #print_works(works) + add_works(akey, works) + print() + +by_authors() \ No newline at end of file diff --git a/ia-legacy-importer/works/find.py b/ia-legacy-importer/works/find.py new file mode 100755 index 00000000..2a54d9ef --- /dev/null +++ b/ia-legacy-importer/works/find.py @@ -0,0 +1,136 @@ +from __future__ import print_function +import web +import re +import sys +from catalog.read_rc import read_rc +from catalog.infostore import get_site +#from catalog.db_read import get_things, withKey +from catalog.amazon.other_editions import find_others + +rc = read_rc() + +re_translation_of = re.compile('^Translation of\b[: ]*([^\n]*?)\.?$', re.I | re.M) + +site = get_site() + +def isbn_link(i): + return '%s (Amazon.com)' % (i, i, i) + +def ol_link(key): + return '%s' % (key, key) + +def search(title, author): + q = { 'type': '/type/author', 'name': author } + print(q) + authors = site.things(q) + print(authors) + seen = set() + pool = set() +# for a in authors: +# q = { 'type': '/type/edition', 'authors': a, 'title': title } +# pool.update(site.things(q)) + found_titles = {} + found_isbn = {} + author_keys = ','.join("'%s'" % a for a in authors) + + print(author_keys) + iter = web.query("select id, key from thing where thing.id in (select thing_id from edition_ref, thing where edition_ref.key_id=11 and edition_ref.value = thing.id and thing.key in (" + author_keys + "))") + key_to_id = {} + id_to_key = {} + for row in iter: + print(row) + key_to_id[row.key] = row.id + id_to_key[row.id] = row.key + + + iter = web.query("select thing_id, edition_str.value as title from edition_str where key_id=3 and thing_id in (select thing_id from edition_ref, thing where edition_ref.key_id=11 and edition_ref.value = 
thing.id and thing.key in (" + author_keys + "))") + id_to_title = {} + title_to_key = {} + for row in iter: + print(row) + t = row.title.lower().strip('.') + id_to_title[row.thing_id] = row.title + title_to_key.setdefault(t, []).append(id_to_key[row.thing_id]) + + if title.lower() not in title_to_key: + print('title not found') + return + + pool = set(title_to_key[title.lower()]) + + editions = [] + while pool: + key = pool.pop() + print(key) + seen.add(key) + e = site.withKey(key) + translation_of = None + if e.notes: + m = re_translation_of.search(e.notes) + if m: + translation_of = m.group(1).lower() + pool.update(k for k in title_to_key[translation_of] if k not in seen) + found_titles.setdefault(translation_of, []).append(key) + if e.isbn_10: + for i in e.isbn_10: + found_isbn.setdefault(i, []).append(key) + join_isbn = ', '.join(map(isbn_link, e.isbn_10)) + else: + join_isbn = '' + rec = { + 'key': key, + 'publish_date': e.publish_date, + 'publishers': ', '.join(p.encode('utf-8') for p in (e.publishers or [])), + 'isbn': join_isbn, + } + editions.append(rec) + + if e.work_titles: + for t in e.work_titles: + t=t.strip('.') + pool.update(k for k in title_to_key.get(t.lower(), []) if k not in seen) + found_titles.setdefault(t, []).append(key) + if e.other_titles: + for t in e.other_titles: + t=t.strip('.') + pool.update(k for k in title_to_key.get(t.lower(), []) if k not in seen) + found_titles.setdefault(t, []).append(key) + + print('') + for e in sorted(editions, key=lambda e: e['publish_date'] and e['publish_date'][-4:]): + print('') + print('') + print('') + print('') + print('
', ol_link(e['key']))
+        print('', e['publish_date'], '', e['publishers'], '', e['isbn'], '')
+
+    if found_titles:
+        print('Other titles')
+        print('')
+        for k, v in found_titles.iteritems():
+            if k == title:
+                continue
+            print('• %s' % (k, author, k), end=' ')
+            print('from', ', '.join(ol_link(i) for i in v))
+        print('')
+
+    extra_isbn = {}
+    for k, v in found_isbn.iteritems():
+        for isbn, note in find_others(k, rc['amazon_other_editions']):
+            if note.lower().find('audio') != -1:
+                continue
+            if isbn not in found_isbn:
+                extra_isbn.setdefault(isbn, []).extend(v)
+
+    if extra_isbn:
+        print('Other ISBN')
+        print('')
+        for k in sorted(extra_isbn):
+            print('• ', isbn_link(k), end=' ')
+            print('from', ', '.join(ol_link(i) for i in extra_isbn[k]))
+        print('
    ') + +title = 'Journey to the centre of the earth' +author = 'Jules Verne' +search(title, author) diff --git a/ia-legacy-importer/works/find_other_editions.py b/ia-legacy-importer/works/find_other_editions.py new file mode 100755 index 00000000..be8dfc1a --- /dev/null +++ b/ia-legacy-importer/works/find_other_editions.py @@ -0,0 +1,65 @@ +#!/usr/local/bin/python2.5 +from __future__ import print_function +import sys +import codecs +from catalog.merge.names import match_name +from catalog.utils import fmt_author, get_title, mk_norm +from catalog.utils.query import query_iter, set_staging, withKey + +# find duplicate authors and other editions of works + +sys.stdout = codecs.getwriter('utf-8')(sys.stdout) +set_staging(True) + +def other_editions(title, wkey, work_author): + # look for other editions with the same title + wakey = work_author['key'] + q = { 'type': '/type/edition', 'title': title } + for k in 'works', 'title_prefix', 'key', 'authors': + q[k] = None + found = [] + for e in query_iter(q): + if not e.get('authors', None): + continue + if e.get('works', None) and any(i['key'] == wkey for i in e['works']): + continue + if any(i['key'] == wakey for i in e['authors']): + continue + for akey in (a['key'] for a in e.get('authors', [])): + a = withKey(akey) + name = a.get('name', '') + if match_name(name, work_author['name'], last_name_only_ok=True): + yield (e, a) + +q = { 'type':'/type/work' } +for k in 'key', 'title', 'authors': + q[k] = None + +for w in query_iter(q): + wkey = w['key'] + titles = set([w['title']]) + q = { 'type': '/type/edition', 'works': wkey } + for k in 'title', 'title_prefix', 'key', 'authors': + q[k] = None + + wakey = w['authors'][0]['key'] + work_author = withKey(wakey) + + for e in query_iter(q): + if not e.get('title', None): + continue + titles.update([get_title(e), e['title']]) + + found = [] + for title in titles: + found += list(other_editions(title, wkey, work_author)) + + if not found: + continue + print(w) + print(titles) + print(wakey + ':', fmt_author(work_author)) + for e, a in found: + print(' ', a['key'] + ": ", fmt_author(a)) + print(' ', e) + print() diff --git a/ia-legacy-importer/works/find_work_for_edition.py b/ia-legacy-importer/works/find_work_for_edition.py new file mode 100644 index 00000000..a108adb1 --- /dev/null +++ b/ia-legacy-importer/works/find_work_for_edition.py @@ -0,0 +1,43 @@ +from __future__ import print_function +# try and find an existing work for a book + +from openlibrary.api import OpenLibrary +from openlibrary.catalog.utils import mk_norm +import sys +from time import time + +ol = OpenLibrary("http://openlibrary.org") + +def find_matching_work(e): + norm_title = mk_norm(e['title']) + + seen = set() + for akey in e['authors']: + q = { + 'type':'/type/work', + 'authors': {'author': {'key': akey}}, + 'limit': 0, + 'title': None, + } + t0 = time() + work_keys = list(ol.query(q)) + t1 = time() - t0 + print('time to find books by author: %.1f seconds' % t1) + for w in work_keys: + wkey = w['key'] + if wkey in seen: + continue + seen.add(wkey) + if not w.get('title'): + continue + if mk_norm(w['title']) == norm_title: + assert ol.query({'key': wkey, 'type': None})[0]['type'] == '/type/work' + return wkey + +def test_book(): + ekey = '/books/OL24335218M' + wkey = find_matching_work(ekey) + if wkey: + print('found match:', wkey) + else: + print('no match') diff --git a/ia-legacy-importer/works/find_works.py b/ia-legacy-importer/works/find_works.py new file mode 100755 index 00000000..cf158cb1 --- /dev/null +++ 
b/ia-legacy-importer/works/find_works.py @@ -0,0 +1,799 @@ +#!/usr/bin/python +# find works and create pages on production + +from __future__ import print_function +import re +import simplejson as json +import sys +import web + +from collections import defaultdict +from lxml import etree +from time import sleep, time, strftime + +from openlibrary.api import OpenLibrary +from openlibrary.catalog.get_ia import get_from_archive, get_data +from openlibrary.catalog.importer.db_read import get_mc +from openlibrary.catalog.marc.fast_parse import get_subfield_values, get_first_tag, get_tag_lines, get_subfields, BadDictionary +from openlibrary.catalog.marc.marc_subject import get_work_subjects, four_types +from openlibrary.catalog.read_rc import read_rc +from openlibrary.catalog.utils import cmp, mk_norm +from openlibrary.catalog.utils.edit import fix_edition +from openlibrary.catalog.utils.query import query_iter, withKey +from openlibrary.solr.update_work import update_work, solr_update, update_author + +import six +from six.moves import urllib +from six.moves.urllib.request import urlopen + + +ol = OpenLibrary("http://openlibrary.org") + +re_skip = re.compile(r'\b([A-Z]|Co|Dr|Jr|Capt|Mr|Mrs|Ms|Prof|Rev|Revd|Hon|etc)\.$') +re_work_key = re.compile(r'^/works/OL(\d+)W$') +re_lang_key = re.compile('^/(?:l|languages)/([a-z]{3})$') +re_author_key = re.compile(r'^/(?:a|authors)/(OL\d+A)$') + +re_ia_marc = re.compile(r'^(?:.*/)?([^/]+)_(marc\.xml|meta\.mrc)(:0:\d+)?$') + +ns = '{http://www.loc.gov/MARC21/slim}' +ns_leader = ns + 'leader' +ns_data = ns + 'datafield' + +def has_dot(s): + return s.endswith('.') and not re_skip.search(s) + +def get_with_retry(k): + for attempt in range(50): + try: + return ol.get(k) + except: + pass + print('retry') + sleep(5) + return ol.get() + +#set_staging(True) + +# sample title: The Dollar Hen (Illustrated Edition) (Dodo Press) +re_parens = re.compile(r'^(.*?)(?: \(.+ (?:Edition|Press|Print|Plays|Collection|Publication|Novels|Mysteries|Book Series|Classics Library|Classics|Books)\))+$', re.I) + +def top_rev_wt(d): + d_sorted = sorted(d.keys(), cmp=lambda i, j: cmp(d[j], d[i]) or cmp(len(j), len(i))) + return d_sorted[0] + +def books_query(akey): # live version + q = { + 'type':'/type/edition', + 'authors': akey, + 'source_records': None, + 'title': None, + 'work_title': None, + 'table_of_contents': None, + 'languages': None, + 'title_prefix': None, + 'subtitle': None, + } + return query_iter(q) + +def freq_dict_top(d): + return sorted(d.keys(), reverse=True, key=lambda i:d[i])[0] + +def get_marc_src(e, mc): + if mc and mc.startswith('amazon:'): + mc = None + if mc and mc.startswith('ia:'): + yield 'ia', mc[3:] + elif mc: + m = re_ia_marc.match(mc) + if m: + yield 'ia', m.group(1) + else: + yield 'marc', mc + source_records = e.get('source_records', []) + if not source_records: + return + for src in source_records: + if src.startswith('ia:'): + if not mc or src != mc: + yield 'ia', src[3:] + continue + if src.startswith('marc:'): + if not mc or src != 'marc:' + mc: + yield 'marc', src[5:] + continue + +def get_ia_work_title(ia): + # FIXME: rewrite to use MARC binary + url = 'http://www.archive.org/download/' + ia + '/' + ia + '_marc.xml' + try: + root = etree.parse(urlopen(url)).getroot() + except KeyboardInterrupt: + raise + except: + return + e = root.find(ns_data + "[@tag='240']") + if e is None: + return + wt = ' '.join(s.text for s in e if s.attrib['code'] == 'a' and s.text) + return wt + +def get_work_title(e, mc): + # use first work title we find in source MARC 
records + wt = None + for src_type, src in get_marc_src(e, mc): + if src_type == 'ia': + wt = get_ia_work_title(src) + if wt: + wt = wt.strip('. ') + if wt: + break + continue + assert src_type == 'marc' + data = None + try: + data = get_data(src) + except ValueError: + print('bad record source:', src) + print('http://openlibrary.org' + e['key']) + continue + except urllib.error.HTTPError as error: + print('HTTP error:', error.code, error.msg) + print(e['key']) + if not data: + continue + is_marc8 = data[9] != 'a' + try: + line = get_first_tag(data, set(['240'])) + except BadDictionary: + print('bad dictionary:', src) + print('http://openlibrary.org' + e['key']) + continue + if line: + wt = ' '.join(get_subfield_values(line, ['a'], is_marc8)).strip('. ') + break + if wt: + return wt + for f in 'work_titles', 'work_title': + e_wt = e.get(f, []) + if e_wt: + assert isinstance(e_wt, list) + return e_wt[0].strip('. ') + +# don't use any of these as work titles +bad_titles = ['Publications', 'Works. English', 'Missal', 'Works', 'Report', \ + 'Letters', 'Calendar', 'Bulletin', 'Plays', 'Sermons', 'Correspondence', \ + 'Bill', 'Bills', 'Selections', 'Selected works', 'Selected works. English', \ + 'The Novels', 'Laws, etc'] + +def get_books(akey, query, do_get_mc=True): + for e in query: + try: + if not e.get('title', None): + continue + except: + print(e) +# if len(e.get('authors', [])) != 1: +# continue + if 'title_prefix' in e and e['title_prefix']: + prefix = e['title_prefix'] + if prefix[-1] != ' ': + prefix += ' ' + title = prefix + e['title'] + else: + title = e['title'] + + title = title.strip(' ') + if has_dot(title): + title = title[:-1] + + m = re_parens.match(title) + if m: + title = m.group(1) + + n = mk_norm(title) + + book = { + 'title': title, + 'norm_title': n, + 'key': e['key'], + } + + lang = e.get('languages', []) + if lang: + book['lang'] = [re_lang_key.match(l['key']).group(1) for l in lang] + + if e.get('table_of_contents', None): + if isinstance(e['table_of_contents'][0], six.string_types): + book['table_of_contents'] = e['table_of_contents'] + else: + assert isinstance(e['table_of_contents'][0], dict) + if e['table_of_contents'][0].get('type', None) == '/type/text': + book['table_of_contents'] = [i['value'] for i in e['table_of_contents']] + if 'subtitle' in e: + book['subtitle'] = e['subtitle'] + + if 'source_records' in e: + book['source_records'] = e['source_records'] + + mc = get_mc(e['key']) if do_get_mc else None + wt = get_work_title(e, mc) + if not wt: + yield book + continue + if wt in bad_titles: + yield book + continue + n_wt = mk_norm(wt) + book['work_title'] = wt + book['norm_wt'] = n_wt + yield book + +def build_work_title_map(equiv, norm_titles): + # map of normalized book titles to normalized work titles + if not equiv: + return {} + title_to_work_title = defaultdict(set) + for (norm_title, norm_wt), v in equiv.items(): + if v != 1: + title_to_work_title[norm_title].add(norm_wt) + + title_map = {} + for norm_title, work_titles in title_to_work_title.items(): + if len(work_titles) == 1: + title_map[norm_title] = list(work_titles)[0] + continue + most_common_title = max(work_titles, key=lambda i:norm_titles[i]) + if norm_title != most_common_title: + title_map[norm_title] = most_common_title + for work_title in work_titles: + if work_title != most_common_title: + title_map[work_title] = most_common_title + return title_map + +def get_first_version(key): + url = 'http://openlibrary.org' + key + '.json?v=1' + try: + return json.load(urlopen(url)) + except: + 
print(url) + raise + +def get_existing_works(akey): + q = { + 'type':'/type/work', + 'authors': {'author': {'key': akey}}, + 'limit': 0, + } + seen = set() + for wkey in ol.query(q): + if wkey in seen: + continue # skip dups + if wkey.startswith('DUP'): + continue + try: + w = get_with_retry(wkey) + except: + print(wkey) + raise + if w['type'] in ('/type/redirect', '/type/delete'): + continue + if w['type'] != '/type/work': + print('infobase error, should only return works') + print(q) + print(w['key']) + assert w['type'] == '/type/work' + yield w + +def find_title_redirects(akey): + title_redirects = {} + for w in get_existing_works(akey): + try: + norm_wt = mk_norm(w['title']) + except: + print(w['key']) + raise + q = {'type':'/type/redirect', 'location': str(w['key']), 'limit': 0} + try: + query_iter = ol.query(q) + except: + print(q) + raise + for r in map(get_first_version, query_iter): + redirect_history = json.load(urlopen('http://openlibrary.org%s.json?m=history' % r['key'])) + if any(v['author'].endswith('/WorkBot') and v['comment'] == "merge works" for v in redirect_history): + continue + #print 'redirect:', r + if mk_norm(r['title']) == norm_wt: + continue + if r['title'] in title_redirects: + assert title_redirects[r['title']] == w['title'] + #print 'redirect:', r['key'], r['title'], 'work:', w['key'], w['title'] + title_redirects[r['title']] = w['title'] + return title_redirects + +def find_works2(book_iter): + var = {} + var['equiv'] = defaultdict(int) # normalized title and work title pairs + var['norm_titles'] = defaultdict(int) # frequency of titles + var['books_by_key'] = {} + var['books'] = [] + # normalized work title to regular title + var['rev_wt'] = defaultdict(lambda: defaultdict(int)) + + for book in book_iter: + if 'norm_wt' in book: + pair = (book['norm_title'], book['norm_wt']) + var['equiv'][pair] += 1 + var['rev_wt'][book['norm_wt']][book['work_title']] +=1 + var['norm_titles'][book['norm_title']] += 1 # used to build title_map + var['books_by_key'][book['key']] = book + var['books'].append(book) + + return var + +def find_works3(var, existing={}): + title_map = build_work_title_map(var['equiv'], var['norm_titles']) + + for a, b in existing.items(): + norm_a = mk_norm(a) + norm_b = mk_norm(b) + var['rev_wt'][norm_b][norm_a] +=1 + title_map[norm_a] = norm_b + + var['works'] = defaultdict(lambda: defaultdict(list)) + var['work_titles'] = defaultdict(list) + for b in var['books']: + if 'eng' not in b.get('lang', []) and 'norm_wt' in b: + var['work_titles'][b['norm_wt']].append(b['key']) + n = b['norm_title'] + title = b['title'] + if n in title_map: + n = title_map[n] + title = top_rev_wt(var['rev_wt'][n]) + var['works'][n][title].append(b['key']) + +def find_work_sort(var): + def sum_len(n, w): + # example n: 'magic' + # example w: {'magic': ['/books/OL1M', ... 
'/books/OL4M']} + # example work_titles: {'magic': ['/books/OL1M', '/books/OL3M']} + return sum(len(i) for i in w.values() + [var['work_titles'][n]]) + return sorted([(sum_len(n, w), n, w) for n, w in var['works'].items()]) + +def find_works(book_iter, existing={}, do_get_mc=True): + + var = find_works2(book_iter) + find_works3(var, existing) + + works = find_work_sort(var) + + for work_count, norm, w in works: + first = sorted(w.items(), reverse=True, key=lambda i:len(i[1]))[0][0] + titles = defaultdict(int) + for key_list in w.values(): + for ekey in key_list: + b = var['books_by_key'][ekey] + title = b['title'] + titles[title] += 1 + keys = var['work_titles'][norm] + for values in w.values(): + keys += values + assert work_count == len(keys) + title = max(titles.keys(), key=lambda i:titles[i]) + toc_iter = ((k, var['books_by_key'][k].get('table_of_contents', None)) for k in keys) + toc = dict((k, v) for k, v in toc_iter if v) + # sometimes keys contains duplicates + editions = [var['books_by_key'][k] for k in set(keys)] + subtitles = defaultdict(lambda: defaultdict(int)) + edition_count = 0 + with_subtitle_count = 0 + for e in editions: + edition_count += 1 + subtitle = e.get('subtitle') or '' + if subtitle != '': + with_subtitle_count += 1 + norm_subtitle = mk_norm(subtitle) + if norm_subtitle != norm: + subtitles[norm_subtitle][subtitle] += 1 + use_subtitle = None + for k, v in subtitles.iteritems(): + lc_k = k.strip(' .').lower() + if lc_k in ('', 'roman') or 'edition' in lc_k: + continue + num = sum(v.values()) + overall = float(num) / float(edition_count) + ratio = float(num) / float(with_subtitle_count) + if overall > 0.2 and ratio > 0.5: + use_subtitle = freq_dict_top(v) + w = {'title': first, 'editions': editions} + if use_subtitle: + w['subtitle'] = use_subtitle + if toc: + w['toc'] = toc + try: + subjects = four_types(get_work_subjects(w, do_get_mc=do_get_mc)) + except: + print(w) + raise + if subjects: + w['subjects'] = subjects + yield w + +def print_works(works): + for w in works: + print(len(w['editions']), w['title']) + print(' ', [e['key'] for e in w['editions']]) + print(' ', w.get('subtitle', None)) + print(' ', w.get('subjects', None)) + + +def books_from_cache(): + for line in open('book_cache'): + yield eval(line) + +def add_subjects_to_work(subjects, w): + mapping = { + 'subject': 'subjects', + 'place': 'subject_places', + 'time': 'subject_times', + 'person': 'subject_people', + } + for k, v in subjects.items(): + k = mapping[k] + subjects = [i[0] for i in sorted(v.items(), key=lambda i:i[1], reverse=True) if i != ''] + existing_subjects = set(w.get(k, [])) + w.setdefault(k, []).extend(s for s in subjects if s not in existing_subjects) + if w.get(k): + w[k] = [six.text_type(i) for i in w[k]] + try: + assert all(i != '' and not i.endswith(' ') for i in w[k]) + except AssertionError: + print('subjects end with space') + print(w) + print(subjects) + raise + +def add_detail_to_work(i, j): + if 'subtitle' in i: + j['subtitle'] = i['subtitle'] + if 'subjects' in i: + add_subjects_to_work(i['subjects'], j) + +def fix_up_authors(w, akey, editions): + print('looking for author:', akey) + #print (w, akey, editions) + seen_akey = False + need_save = False + for a in w.get('authors', []): + print('work:', w['key']) + obj = withKey(a['author']['key']) + if obj['type']['key'] == '/type/redirect': + a['author']['key'] = obj['location'] + print(obj['key'], 'redirects to', obj['location']) + #a['author']['key'] = '/authors/' + re_author_key.match(a['author']['key']).group(1) + 
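# after following the redirect the author key should already be in canonical /authors/ form; the assert below enforces that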
assert a['author']['key'].startswith('/authors/') + obj = withKey(a['author']['key']) + assert obj['type']['key'] == '/type/author' + need_save = True + if akey == a['author']['key']: + seen_akey = True + if seen_akey: + if need_save: + print('need save:', a) + return need_save + try: + ekey = editions[0]['key'] + except: + print('editions:', editions) + raise + #print 'author %s missing. copying from first edition %s' % (akey, ekey) + #print 'before:' + for a in w.get('authors', []): + print(a) + e = withKey(ekey) + #print e + if not e.get('authors', None): + print('no authors in edition') + return + print('authors from first edition', e['authors']) + w['authors'] = [{'type':'/type/author_role', 'author':a} for a in e['authors']] + #print 'after:' + #for a in w['authors']: + # print a + return True + +def new_work(akey, w, do_updates, fh_log): + ol_work = { + 'title': w['title'], + 'type': '/type/work', + 'authors': [{'type':'/type/author_role', 'author': akey}], + } + add_detail_to_work(w, ol_work) + print(ol_work, file=fh_log) + if do_updates: + for attempt in range(5): + try: + wkey = ol.new(ol_work, comment='work found') + break + except: + if attempt == 4: + raise + print('retrying: %d attempt' % attempt) + print('new work:', wkey, repr(w['title']), file=fh_log) + else: + print('new work:', repr(w['title']), file=fh_log) + update = [] + for e in w['editions']: + try: + e = ol.get(e['key']) + except: + print('edition:', e['key']) + raise + if do_updates: + e['works'] = [{'key': wkey}] + assert e['type'] == '/type/edition' + update.append(e) + if do_updates: + print(ol.save_many(update, "add editions to new work"), file=fh_log) + return [wkey] + return [] + +def fix_toc(e): + toc = e.get('table_of_contents') + if not toc: + return + try: + if isinstance(toc[0], dict) and toc[0]['type'] == '/type/toc_item': + return + except: + print('toc') + print(toc) + print(repr(toc)) + return [{'title': six.text_type(i), 'type': '/type/toc_item'} for i in toc if i] + +def update_work_with_best_match(akey, w, work_to_edition, do_updates, fh_log): + work_updated = [] + best = w['best_match']['key'] + update = [] + subjects_from_existing_works = defaultdict(set) + for wkey in w['existing_works'].iterkeys(): + if wkey == best: + continue + existing = get_with_retry(wkey) + for k in 'subjects', 'subject_places', 'subject_times', 'subject_people': + if existing.get(k): + subjects_from_existing_works[k].update(existing[k]) + + update.append({'type': '/type/redirect', 'location': best, 'key': wkey}) + work_updated.append(wkey) + + for wkey in w['existing_works'].iterkeys(): + editions = set(work_to_edition[wkey]) + editions.update(e['key'] for e in w['editions']) + for ekey in editions: + e = get_with_retry(ekey) + e['works'] = [{'key': best}] + authors = [] + for akey in e['authors']: + a = get_with_retry(akey) + if a['type'] == '/type/redirect': + m = re_author_key.match(a['location']) + akey = '/authors/' + m.group(1) + authors.append({'key': str(akey)}) + e['authors'] = authors + new_toc = fix_toc(e) + if new_toc: + e['table_of_contents'] = new_toc + update.append(e) + + cur_work = w['best_match'] + need_save = fix_up_authors(cur_work, akey, w['editions']) + if any(subjects_from_existing_works.values()): + need_save = True + if need_save or cur_work['title'] != w['title'] \ + or ('subtitle' in w and 'subtitle' not in cur_work) \ + or ('subjects' in w and 'subjects' not in cur_work): + if cur_work['title'] != w['title']: + print(( 'update work title:', best, repr(cur_work['title']), '->', 
repr(w['title']))) + existing_work = get_with_retry(best) + assert existing_work['type'] == '/type/work', "{type} == '/type/work'".format(**existing_work) + existing_work['title'] = w['title'] + for k, v in subjects_from_existing_works.items(): + existing_subjects = set(existing_work.get(k, [])) + existing_work.setdefault(k, []).extend(s for s in v if s not in existing_subjects) + add_detail_to_work(w, existing_work) + for a in existing_work.get('authors', []): + obj = withKey(a['author']) + if obj['type']['key'] != '/type/redirect': + continue + new_akey = obj['location'] + a['author'] = {'key': new_akey} + assert new_akey.startswith('/authors/') + obj = withKey(new_akey) + assert obj['type']['key'] == '/type/author' + print('existing:', existing_work, file=fh_log) + print('subtitle:', repr(existing_work['subtitle']) if 'subtitle' in existing_work else 'n/a', file=fh_log) + update.append(existing_work) + work_updated.append(best) + if do_updates: + try: + print(ol.save_many(update, 'merge works'), file=fh_log) + except: + for page in update: + print(page) + raise + return work_updated + +def update_works(akey, works, do_updates=False): + # we can now look up all works by an author + if do_updates: + rc = read_rc() + ol.login('WorkBot', rc['WorkBot']) + assert do_updates + + fh_log = open('/1/var/log/openlibrary/work_finder/' + strftime('%F_%T'), 'w') + works = list(works) + print(akey, file=fh_log) + print('works:', file=fh_log) + + while True: # until redirects repaired + q = {'type':'/type/edition', 'authors': akey, 'works': None} + work_to_edition = defaultdict(set) + edition_to_work = defaultdict(set) + for e in query_iter(q): + if not isinstance(e, dict): + continue + if e.get('works', None): + for w in e['works']: + work_to_edition[w['key']].add(e['key']) + edition_to_work[e['key']].add(w['key']) + + work_by_key = {} + fix_redirects = [] + for k, editions in work_to_edition.items(): + w = withKey(k) + if w['type']['key'] == '/type/redirect': + wkey = w['location'] + print('redirect found', w['key'], '->', wkey, editions, file=fh_log) + assert re_work_key.match(wkey) + for ekey in editions: + e = get_with_retry(ekey) + e['works'] = [{'key': wkey}] + fix_redirects.append(e) + continue + work_by_key[k] = w + if not fix_redirects: + print('no redirects left', file=fh_log) + break + print('save redirects', file=fh_log) + try: + ol.save_many(fix_redirects, "merge works") + except: + for r in fix_redirects: + print(r) + raise + + all_existing = set() + work_keys = [] + print('edition_to_work:', file=fh_log) + print(repr(dict(edition_to_work)), file=fh_log) + print(file=fh_log) + print('work_to_edition', file=fh_log) + print(repr(dict(work_to_edition)), file=fh_log) + print(file=fh_log) + +# open('edition_to_work', 'w').write(repr(dict(edition_to_work))) +# open('work_to_edition', 'w').write(repr(dict(work_to_edition))) +# open('work_by_key', 'w').write(repr(dict(work_by_key))) + + work_title_match = {} + works_by_title = {} + for w in works: # 1st pass + for e in w['editions']: + ekey = e['key'] if isinstance(e, dict) else e + for wkey in edition_to_work.get(ekey, []): + try: + wtitle = work_by_key[wkey]['title'] + except: + print('bad work:', wkey) + raise + if wtitle == w['title']: + work_title_match[wkey] = w['title'] + + wkey_to_new_title = defaultdict(set) + + for w in works: # 2nd pass + works_by_title[w['title']] = w + w['existing_works'] = defaultdict(int) + for e in w['editions']: + ekey = e['key'] if isinstance(e, dict) else e + for wkey in edition_to_work.get(ekey, []): + if 
wkey in work_title_match and work_title_match[wkey] != w['title']: + continue + wtitle = work_by_key[wkey]['title'] + w['existing_works'][wkey] += 1 + wkey_to_new_title[wkey].add(w['title']) + + existing_work_with_conflict = defaultdict(set) + + for w in works: # 3rd pass + for wkey, v in w['existing_works'].iteritems(): + if any(title != w['title'] for title in wkey_to_new_title[wkey]): + w['has_conflict'] = True + existing_work_with_conflict[wkey].add(w['title']) + break + + for wkey, v in existing_work_with_conflict.iteritems(): + cur_work = work_by_key[wkey] + existing_titles = defaultdict(int) + for ekey in work_to_edition[wkey]: + e = withKey(ekey) + title = e['title'] + if e.get('title_prefix', None): + title = e['title_prefix'].strip() + ' ' + e['title'] + existing_titles[title] += 1 + best_match = max(v, key=lambda wt: existing_titles[wt]) + works_by_title[best_match]['best_match'] = work_by_key[wkey] + for wtitle in v: + del works_by_title[wtitle]['has_conflict'] + if wtitle != best_match: + works_by_title[wtitle]['existing_works'] = {} + + def other_matches(w, existing_wkey): + return [title for title in wkey_to_new_title[existing_wkey] if title != w['title']] + + works_updated_this_session = set() + + for w in works: # 4th pass + assert 'has_conflict' not in w, 'w: {}'.format(w) + if len(w['existing_works']) == 1: + existing_wkey = w['existing_works'].keys()[0] + if not other_matches(w, existing_wkey): + w['best_match'] = work_by_key[existing_wkey] + if 'best_match' in w: + updated = update_work_with_best_match(akey, w, work_to_edition, do_updates, fh_log) + for wkey in updated: + if wkey in works_updated_this_session: + print(wkey, 'already updated!', file=fh_log) + print(wkey, 'already updated!') + works_updated_this_session.update(updated) + continue + if not w['existing_works']: + updated = new_work(akey, w, do_updates, fh_log) + for wkey in updated: + assert wkey not in works_updated_this_session + works_updated_this_session.update(updated) + continue + + assert not any(other_matches(w, wkey) for wkey in w['existing_works'].iterkeys()) + best_match = max(w['existing_works'].iteritems(), key=lambda i:i[1])[0] + w['best_match'] = work_by_key[best_match] + updated = update_work_with_best_match(akey, w, work_to_edition, do_updates, fh_log) + for wkey in updated: + if wkey in works_updated_this_session: + print(wkey, 'already updated!', file=fh_log) + print(wkey, 'already updated!') + works_updated_this_session.update(updated) + + #if not do_updates: + # return [] + + return [withKey(key) for key in works_updated_this_session] + +if __name__ == '__main__': + akey = '/authors/' + sys.argv[1] + + title_redirects = find_title_redirects(akey) + works = find_works(akey, get_books(akey, books_query(akey)), existing=title_redirects) + to_update = update_works(akey, works, do_updates=True) + + requests = [] + for w in to_update: + requests += update_work(w) + + if to_update: + solr_update(requests + [''], debug=True) + + requests = update_author(akey) + solr_update(requests + [''], debug=True) diff --git a/ia-legacy-importer/works/from_sample.py b/ia-legacy-importer/works/from_sample.py new file mode 100644 index 00000000..397f52b9 --- /dev/null +++ b/ia-legacy-importer/works/from_sample.py @@ -0,0 +1,230 @@ +from __future__ import print_function +import web +import re +import sys +import codecs +from catalog.marc.fast_parse import * +from catalog.utils import pick_first_date +import catalog.marc.new_parser as parser + +sys.stdout = codecs.getwriter('utf-8')(sys.stdout) + +re_recording 
= re.compile('\x1f(hsound ?record|[hn] ?\[\[?(sound|video|phonodisc))', re.I) +re_end_dot = re.compile('[^ ][^ ]\.$', re.UNICODE) +re_marc_name = re.compile('^(.*), (.*)$') + +authors = {} +family_names = {} +by_author = {} +by_contrib = {} + +def remove_trailing_dot(s): + m = re_end_dot.search(s) + if m: + s = s[:-1] + return s + +def strip_q(q): + if q.endswith(').'): + q = q[:-1] + q = q.strip(' ()/,;:') + return q + +def read(data): + want = ['008', '041', '100', '110', '111', '130', '240', '245', '500', '700', '710', '711'] + fields = get_tag_lines(data, ['006', '008', '245', '260'] + want) + seen_008 = False + found = [] + for tag, line in fields: + if tag in want: + found.append((tag, line)) + if tag == '006': + if line[0] == 'm': # don't want electronic resources + return (fields, None) + continue + if tag == '008': + if seen_008: # dup + return (fields, None) + seen_008 = True + continue + if tag in ('240', '245', '260'): + if re_recording.search(line): # sound recording + return (fields, None) + continue + return (fields, found) + +def initials(s): + return [i[0] for i in s.split(' ')] + +def parse_person(line): + contents = get_person_content(line) + marc_orig = list(get_all_subfields(line)), + if not ('a' in contents or 'c' in contents): + return marc_orig, {} + assert 'a' in contents or 'c' in contents + + if 'd' in contents: + author = pick_first_date(contents['d']) + else: + author = {} + #author['marc_orig'] = list(get_all_subfields(line)), + for tag, f in [ ('b', 'numeration'), ('c', 'title') ]: + if tag in contents: + author[f] = ' '.join(x.strip(' /,;:') for x in contents[tag]) + + if 'a' in contents: + name = ' '.join(x.strip(' /,;:') for x in contents['a']) + name = remove_trailing_dot(name) + m = re_marc_name.match(name) + if m: + author['family_name'] = m.group(1) + author['given_names'] = m.group(2) + author['name'] = m.group(2) + ' ' + m.group(1) + else: + author['name'] = name + name_subfields = get_subfield_values(line, ['a', 'b', 'c']) + author['sort'] = ' '.join(v.strip(' /,;:') for v in name_subfields) + + + if 'q' in contents: + if len(contents['q']) != 1: + print(marc_orig) + assert len(contents['q']) == 1 + q = strip_q(contents['q'][0]) + if 'given_names' in authors: + assert initials(q) == initials(author['given_names']) \ + or q.startswith(author['given_names']) + author['given_names'] = q + return marc_orig, author + +def test_parse_person(): + line = '1 \x1faMoeran, E. J.\x1fq(Ernest John)\x1fq(1894-1950)\x1e' + person = ([('a', u'Moeran, E. J.'), ('q', u'(Ernest John)'), ('q', u'(1894-1950)')],) + parse_person(line) + +#test_parse_person() + +def full_title(line): + title = ' '.join(v for k, v in line if k in ('a', 'b')).strip(' /,;:') + return remove_trailing_dot(title) + +def test_strip_q(): + for i in ['(%s),', '(%s)', '(%s,']: + k = i % ('foo') + j = strip_q(k) + print(k, j) + assert j == 'foo' + + name = 'John X.' 
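+    # the trailing dot inside the parentheses is not in strip_q's strip set, so it must survive unchanged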
+ assert name == strip_q('(%s)' % name) + +def print_author(a): + for k in ('name', 'sort', 'numeration', 'title', 'given_names', 'family_name', 'birth_date', 'death_date'): + print("%12s: %s" % (k, author.get(k, ''))) + + +def person_as_tuple(p): + return tuple(p.get(i, None) for i in ('sort', 'birth_date', 'death_date')) + +def family_name(a): + if 'family_name' not in a: + return + this = a['family_name'] + family_names.setdefault(this, {}) + as_tuple = tuple(a.get(i, None) for i in ('sort', 'birth_date', 'death_date')) + as_tuple = person_as_tuple(a) + family_names[this][as_tuple] = family_names[this].get(as_tuple, 0) + 1 + +interested = set(['Rowling', 'Shakespeare', 'Sagan', 'Darwin', 'Verne', 'Beckett', 'Churchill', 'Dickens', 'Twain', 'Doyle']) +sorted_interest = sorted(interested) + +def edition_list(l): + for e in l: + print(e['loc']) + for k in sorted((k for k in e.keys() if k.isdigit()), key=int): + if k == '245': + t = ' '.join(v.strip(' /,;:') for k, v in e[k][0] if k == 'a') + title = remove_trailing_dot(t) + full = full_title(e[k][0]) + print(' title:', title) + if title != full: + print('full title:', full) + print(' ', k, e[k]) + print('---') + +def print_interest(): + for k in sorted_interest: + if k not in family_names: + continue + print(k) + for a in sorted(family_names[k].keys()): + if family_names[k][a] > 5: + print(" %3d %s" % (family_names[k][a], a)) + if a in by_author: + print(" by: ") + for i in sorted(by_author[a].keys()): + print(' WORK: %s (%d)' % (i, len(by_author[a][i]))) + edition_list(by_author[a][i]) +# if a in by_contrib: +# print " contrib: " +# edition_list(by_contrib[a]) + print() + +def work_title(edition): + if '240' in edition: + t = ' '.join(v for k, v in edition['240'][0] if k in ('a', 'm', 'n', 'p', 'r')) + else: + t = ' '.join(v.strip(' /,;:') for k, v in edition['245'][0] if k == 'a') + return remove_trailing_dot(t) + +#for line in open(sys.argv[1]): +for line in sys.stdin: + loc, data = eval(line) + (orig_fields, fields) = read(data) + if not fields: + continue + new_interest = False + edition = {} + for tag, l in fields: + #if tag in ('100', '700'): + if tag == '100': + try: + marc, person = parse_person(l) + except: + print(loc) + raise + if not person: + continue + #print author['marc_orig'] +# print marc + if person.get('family_name', None) in interested: +# family_name(person) + new_interest = True +# print_author(author) + continue + tag_map = { '100': 'authors', '700': 'contribs' } + person['marc'] = marc + edition.setdefault(tag_map[tag], []).append(person) + continue + if tag == '008': + lang = str(l)[35:38] + edition['lang'] = lang + continue + edition.setdefault(tag, []).append(list(get_all_subfields(line))) + #for k in sorted(family_names.keys()): + + if new_interest: + edition['loc'] = loc + print((loc, data)) + continue + title = work_title(edition) +# rec = parser.read_edition(loc, data) + for p in edition.get('authors', []): + a = by_author.setdefault(person_as_tuple(p), {}) + a.setdefault(title, []).append(edition) +# for p in edition.get('contribs', []): +# by_contrib.setdefault(person_as_tuple(p), []).append(edition) +for k, v in by_author.items(): + print((k, v)) +#print_interest() + diff --git a/ia-legacy-importer/works/live.py b/ia-legacy-importer/works/live.py new file mode 100755 index 00000000..35c3a67e --- /dev/null +++ b/ia-legacy-importer/works/live.py @@ -0,0 +1,474 @@ +#!/usr/bin/python + +# find works and create pages on production + +from __future__ import print_function +import re +import sys +import codecs 
+import web +from openlibrary.catalog.get_ia import get_from_archive, get_data +from openlibrary.catalog.marc.fast_parse import get_subfield_values, get_first_tag, get_tag_lines, get_subfields, BadDictionary +from openlibrary.catalog.utils.query import query_iter, set_staging, query +from openlibrary.catalog.utils import cmp, mk_norm +from openlibrary.catalog.read_rc import read_rc +from collections import defaultdict +from pprint import pformat +from openlibrary.catalog.utils.edit import fix_edition +from openlibrary.catalog.importer.db_read import get_mc +from openlibrary.api import OpenLibrary, Reference +from lxml import etree +from time import sleep, time + +import six +from six.moves import urllib + + +rc = read_rc() + +ol = OpenLibrary("http://openlibrary.org") +ol.login('WorkBot', rc['WorkBot']) + +def write_log(cat, key, title): + print((("%.2f" % time()), cat, key, title), file=fh_log) + fh_log.flush() + +sys.stdout = codecs.getwriter('utf-8')(sys.stdout) +re_skip = re.compile('\b([A-Z]|Co|Dr|Jr|Capt|Mr|Mrs|Ms|Prof|Rev|Revd|Hon|etc)\.$') + +re_ia_marc = re.compile('^(?:.*/)?([^/]+)_(marc\.xml|meta\.mrc)(:0:\d+)?$') + +ns = '{http://www.loc.gov/MARC21/slim}' +ns_leader = ns + 'leader' +ns_data = ns + 'datafield' + +def has_dot(s): + return s.endswith('.') and not re_skip.search(s) + +#set_staging(True) + +# sample title: The Dollar Hen (Illustrated Edition) (Dodo Press) +re_parens = re.compile('^(.*?)(?: \(.+ (?:Edition|Press)\))+$') + +def key_int(key): + # extract the number from a key like /a/OL1234A + return int(web.numify(key)) + +def update_work_edition(ekey, wkey, use): + print((ekey, wkey, use)) + e = ol.get(ekey) + works = [] + for w in e['works']: + if w == wkey: + if use not in works: + works.append(Reference(use)) + else: + if w not in works: + works.append(w) + + if e['works'] == works: + return + print('before:', e['works']) + print('after:', works) + e['works'] = works + print(ol.save(e['key'], e, 'remove duplicate work page')) + +def top_rev_wt(d): + d_sorted = sorted(d.keys(), cmp=lambda i, j: cmp(d[j], d[i]) or cmp(len(j), len(i))) + return d_sorted[0] + +def books_query(akey): # live version + q = { + 'type':'/type/edition', + 'authors': akey, + 'source_records': None, + 'title': None, + 'work_title': None, + 'languages': None, + 'title_prefix': None, + 'subtitle': None, + } + return query_iter(q) + +def freq_dict_top(d): + return sorted(d.keys(), reverse=True, key=lambda i:d[i])[0] + +def get_marc_src(e): + mc = get_mc(e['key']) + if mc and mc.startswith('amazon:'): + mc = None + if mc and mc.startswith('ia:'): + yield 'ia', mc[3:] + elif mc: + m = re_ia_marc.match(mc) + if m: + #print 'IA marc match:', m.group(1) + yield 'ia', m.group(1) + else: + yield 'marc', mc + source_records = e.get('source_records', []) + if not source_records: + return + for src in source_records: + if src.startswith('ia:'): + if not mc or src != mc: + yield 'ia', src[3:] + continue + if src.startswith('marc:'): + if not mc or src != 'marc:' + mc: + yield 'marc', src[5:] + continue + +def get_ia_work_title(ia): + url = 'http://www.archive.org/download/' + ia + '/' + ia + '_marc.xml' + try: + root = etree.parse(urllib.request.urlopen(url)).getroot() + except KeyboardInterrupt: + raise + except: + #print 'bad XML', ia + #print url + return + #print etree.tostring(root) + e = root.find(ns_data + "[@tag='240']") + if e is None: + return + #print e.tag + wt = ' '.join(s.text for s in e if s.attrib['code'] == 'a' and s.text) + return wt + +def get_work_title(e): + # use first work title we 
find in source MARC records + wt = None + for src_type, src in get_marc_src(e): + if src_type == 'ia': + wt = get_ia_work_title(src) + if wt: + break + continue + assert src_type == 'marc' + data = None + #print 'get from archive:', src + try: + data = get_data(src) + except ValueError: + print('bad record source:', src) + print('http://openlibrary.org' + e['key']) + continue + except urllib.error.HTTPError as error: + print('HTTP error:', error.code, error.msg) + print(e['key']) + if not data: + continue + try: + line = get_first_tag(data, set(['240'])) + except BadDictionary: + print('bad dictionary:', src) + print('http://openlibrary.org' + e['key']) + continue + if line: + wt = ' '.join(get_subfield_values(line, ['a'])).strip('. ') + break + if wt: + return wt + if not e.get('work_titles', []): + return + print('work title in MARC, but not in OL') + print('http://openlibrary.org' + e['key']) + return e['work_titles'][0] + +def get_books(akey, query): + for e in query: + if not e.get('title', None): + continue +# if len(e.get('authors', [])) != 1: +# continue + if 'title_prefix' in e and e['title_prefix']: + prefix = e['title_prefix'] + if prefix[-1] != ' ': + prefix += ' ' + title = prefix + e['title'] + else: + title = e['title'] + + title = title.strip(' ') + if has_dot(title): + title = title[:-1] + if title.strip('. ') in ['Publications', 'Works', 'Report', \ + 'Letters', 'Calendar', 'Bulletin', 'Plays', 'Sermons', 'Correspondence']: + continue + + m = re_parens.match(title) + if m: + title = m.group(1) + + n = mk_norm(title) + + book = { + 'title': title, + 'norm_title': n, + 'key': e['key'], + } + + lang = e.get('languages', []) + if lang: + book['lang'] = [l['key'][3:] for l in lang] + + if e.get('table_of_contents', None): + if isinstance(e['table_of_contents'][0], six.string_types): + book['table_of_contents'] = e['table_of_contents'] + else: + assert isinstance(e['table_of_contents'][0], dict) + if e['table_of_contents'][0]['type'] == '/type/text': + book['table_of_contents'] = [i['value'] for i in e['table_of_contents']] + + wt = get_work_title(e) + if not wt: + yield book + continue + if wt in ('Works', 'Selections'): + yield book + continue + n_wt = mk_norm(wt) + book['work_title'] = wt + book['norm_wt'] = n_wt + yield book + +def build_work_title_map(equiv, norm_titles): + # map of book titles to work titles + title_to_work_title = defaultdict(set) + for (norm_title, norm_wt), v in equiv.items(): + if v != 1: + title_to_work_title[norm_title].add(norm_wt) + + title_map = {} + for title, v in title_to_work_title.items(): + if len(v) == 1: + title_map[title] = list(v)[0] + continue + most_common_title = max(v, key=lambda i:norm_titles[i]) + if title != most_common_title: + title_map[title] = most_common_title + for i in v: + if i != most_common_title: + title_map[i] = most_common_title + return title_map + +def find_works(akey, book_iter): + equiv = defaultdict(int) # title and work title pairs + norm_titles = defaultdict(int) # frequency of titles + books_by_key = {} + books = [] + rev_wt = defaultdict(lambda: defaultdict(int)) + + for book in book_iter: + if 'norm_wt' in book: + pair = (book['norm_title'], book['norm_wt']) + equiv[pair] += 1 + rev_wt[book['norm_wt']][book['work_title']] +=1 + norm_titles[book['norm_title']] += 1 + books_by_key[book['key']] = book + books.append(book) + + title_map = build_work_title_map(equiv, norm_titles) + + works = defaultdict(lambda: defaultdict(list)) + work_titles = defaultdict(list) + for b in books: + if 'eng' not in b.get('lang', 
[]) and 'norm_wt' in b: + work_titles[b['norm_wt']].append(b['key']) + continue + n = b['norm_title'] + title = b['title'] + if n in title_map: + n = title_map[n] + title = top_rev_wt(rev_wt[n]) + works[n][title].append(b['key']) + + works = sorted([(sum(map(len, w.values() + [work_titles[n]])), n, w) for n, w in works.items()]) + + for work_count, norm, w in works: +# if work_count < 2: +# continue + first = sorted(w.items(), reverse=True, key=lambda i:len(i[1]))[0][0] + titles = defaultdict(int) + for key_list in w.values(): + for ekey in key_list: + b = books_by_key[ekey] + title = b['title'] + titles[title] += 1 + keys = work_titles[norm] + for values in w.values(): + keys += values + assert work_count == len(keys) + title = max(titles.keys(), key=lambda i:titles[i]) + toc = [(k, books_by_key[k].get('table_of_contents', None)) for k in keys] + yield {'title': first, 'editions': keys, 'toc': dict((k, v) for k, v in toc if v)} + +def print_works(works): + for w in works: + print(len(w['editions']), w['title']) + +def toc_items(toc_list): + return [{'title': six.text_type(item), 'type': Reference('/type/toc_item')} for item in toc_list] + +def add_works(works): + q = [] + for w in works: + cur = { + 'authors': [{'author': Reference(w['author'])}], + 'type': '/type/work', + 'title': w['title'] + } + if 'subjects' in w: + cur['subjects'] = w['subjects'] + q.append(cur) + try: + return ol.new(q, comment='create work page') + except: + print(q) + raise + +def add_work(akey, w): + q = { + 'authors': [{'author': Reference(akey)}], + 'type': '/type/work', + 'title': w['title'] + } + try: + wkey = ol.new(q, comment='create work page') + except: + print(q) + raise + write_log('work', wkey, w['title']) + assert isinstance(wkey, six.string_types) + for ekey in w['editions']: + e = ol.get(ekey) + fix_edition(ekey, e, ol) + #assert 'works' not in e + write_log('edition', ekey, e.get('title', 'title missing')) + e['works'] = [Reference(wkey)] + yield e + +def save_editions(queue): + print('saving') + try: + print(ol.save_many(queue, 'add edition to work page')) + except: + print('ol.save_many() failed, trying again in 30 seconds') + sleep(30) + print(ol.save_many(queue, 'add edition to work page')) + print('saved') + +def merge_works(work_keys): + use = "/works/OL%dW" % min(key_int(w) for w in work_keys) + for wkey in work_keys: + if wkey == use: + continue + w_query = {'type':'/type/edition', 'works':wkey, 'limit':False} + for e in ol.query(w_query): # returns strings? 
+ print(e) + update_work_edition(e, wkey, use) + w = ol.get(wkey) + assert w['type'] == '/type/work' + w['type'] = '/type/redirect' + w['location'] = use + print(ol.save(wkey, w, 'delete duplicate work page')) + +def update_edition(ekey, wkey): + e = ol.get(ekey) + fix_edition(ekey, e, ol) + write_log('edition', ekey, e.get('title', 'title missing')) + if e.get('works', []): + assert len(e['works']) == 1 + if e['works'][0] != wkey: + print('e:', e) + print('wkey:', wkey) + print('ekey:', ekey) + print('e["works"]:', e['works']) + #merge_works([e['works'][0], wkey]) + #assert e['works'][0] == wkey + return None + e['works'] = [Reference(wkey)] + return e + +def run_queue(queue): + work_keys = add_works(queue) + for w, wkey in zip(queue, work_keys): + w['key'] = wkey + write_log('work', wkey, w['title']) + for ekey in w['editions']: + e = update_edition(ekey, wkey) + if e: + yield e + +def get_work_key(title, akey): + q = { + 'type': '/type/work', + 'title': title, + 'authors': None, + } + matches = [w for w in ol.query(q) if any(a['author'] == akey for a in w['authors'])] + if not matches: + return None + if len(matches) != 1: + print('time to fix duplicate works') + print(repr(title)) + print('http://openlibrary.org' + akey) + print(matches) + assert len(matches) == 1 + return matches[0]['key'] + +def by_authors(): + skip = '/a/OL25755A' + q = { 'type':'/type/author', 'name': None } + for a in query_iter(q): + akey = a['key'] + if skip: + if akey == skip: + skip = None + else: + continue + write_log('author', akey, a.get('name', 'name missing')) + + works = find_works(akey, get_books(akey, books_query(akey))) + print((akey, repr(a['name']))) + + for w in works: + w['author'] = akey + wkey = get_work_key(w['title'], akey) + if wkey: + w['key'] = wkey + yield w + +if __name__ == '__main__': + fh_log = open('/1/edward/logs/WorkBot', 'a') + edition_queue = [] + work_queue = [] + + for w in by_authors(): + if 'key' in w: + for ekey in w['editions']: + e = update_edition(ekey, w['key']) + if e: + edition_queue.append(e) + continue + + work_queue.append(w) + if len(work_queue) > 1000: + for e in run_queue(work_queue): + print(e['key'], repr(e['title'])) + edition_queue.append(e) + if len(edition_queue) > 1000: + save_editions(edition_queue) + edition_queue = [] + sleep(5) + work_queue = [] + + print('almost finished') + for e in run_queue(work_queue): + edition_queue.append(e) + save_editions(edition_queue) + print('finished') + + fh_log.close() diff --git a/ia-legacy-importer/works/load_to_staging.py b/ia-legacy-importer/works/load_to_staging.py new file mode 100644 index 00000000..d5046826 --- /dev/null +++ b/ia-legacy-importer/works/load_to_staging.py @@ -0,0 +1,47 @@ +from __future__ import print_function +import sys +sys.path.remove('/usr/local/lib/python2.5/site-packages/web.py-0.23-py2.5.egg') +from staging_save import Infogami +from catalog.read_rc import read_rc +import catalog.importer.db_read as db_read +import re +import sys +import codecs + +db_read.set_staging(True) + +sys.stdout = codecs.getwriter('utf-8')(sys.stdout) + +rc = read_rc() +infogami = Infogami() +infogami.login('edward', rc['edward']) + +for line in open('works_for_staging'): + work_key, title, authors, editions = eval(line) + if not all(db_read.withKey('/a/' + a) for a in authors): + continue + work = db_read.withKey(work_key) + print(work_key) + if work: + continue + if not work: + q = { + 'create': 'unless_exists', + 'type': { 'key': '/type/work' }, + 'key': work_key, + 'title': title, + 'authors': [{'key': '/a/' + 
a} for a in authors], + } + ret = infogami.write(q, comment='create work') + print(ret) + for edition_key in editions: + edition = db_read.withKey(edition_key) + if not edition: continue + if 'works' in edition: continue + q = { + 'key': edition_key, + 'works': { 'connect': 'update_list', 'value': [{'key': work_key}]} + } + ret = infogami.write(q, comment='add work to edition') + print(edition_key, ret) + assert ret['result']['updated'] diff --git a/ia-legacy-importer/works/sample_marc.py b/ia-legacy-importer/works/sample_marc.py new file mode 100644 index 00000000..cf2f1c81 --- /dev/null +++ b/ia-legacy-importer/works/sample_marc.py @@ -0,0 +1,19 @@ +from __future__ import print_function +from catalog.marc.all import iter_marc +import re + +# random authors and subjects +terms = [ + 'rowling', 'harry potter', 'shakespeare', 'hamlet', 'twain', 'darwin', + 'sagan', 'huckleberry finn', 'tom sawyer', 'verne', 'waiting for godot', + 'beckett', 'churchill', 'darwin', 'dickens', 'doyle', 'leonardo', + 'da vinci', +] + +re_terms = re.compile('(' + '|'.join(terms) + ')', re.I) + +out = open('/1/pharos/edward/sample_marc2', 'w') +for rec_no, pos, loc, data in iter_marc(): + if re_terms.search(data): + print((loc, data), file=out) +out.close() diff --git a/ia-legacy-importer/works/test_find_works.py b/ia-legacy-importer/works/test_find_works.py new file mode 100644 index 00000000..1f82cae7 --- /dev/null +++ b/ia-legacy-importer/works/test_find_works.py @@ -0,0 +1,147 @@ +# -*- coding: utf-8 -*- +from openlibrary.catalog.merge.normalize import normalize +from openlibrary.catalog.works.find_works import top_rev_wt, has_dot, freq_dict_top, find_works, get_books, find_works2, build_work_title_map, find_works3, find_work_sort + + +def test_has_dot(): + assert has_dot('Magic.') + assert not has_dot('Magic') + assert not has_dot('Magic etc.') + +def test_top_rev_wt(): + input_data = { + 'aaa': 'test data', + 'aaaa': 'more test data', + 'bbbb': 'test date', + 'cc': 'some more test data', + } + assert top_rev_wt(input_data) == 'bbbb' + +def test_freq_dict_top(): + assert freq_dict_top({'a': 0}) == 'a' + assert freq_dict_top({'a': 3, 'b': 6, 'c': 4}) == 'b' + +def test_find_works(): + works = list(find_works([])) + assert works == [] + + books = [{'title': 'Magic', 'key': '/books/OL1M'}] + book_iter = get_books('', books, do_get_mc=False) + + books2 = list(book_iter) + assert books2 == [{'key': '/books/OL1M', 'norm_title': 'magic', 'title': 'Magic'}] + + var = find_works2(books2) + assert var['equiv'] == {} + assert var['norm_titles'] == {'magic': 1} + assert var['books_by_key'] == {'/books/OL1M': books2[0]} + assert var['books'] == books2 + assert var['rev_wt'] == {} + + assert build_work_title_map({}, {'magic': 1}) == {} + assert build_work_title_map({}, {'magic': 2, 'test': 0}) == {} + + works = list(find_works(books2, do_get_mc=False)) + expect = [ + { 'title': 'Magic', + 'editions': [{ + 'key': '/books/OL1M', + 'norm_title': 'magic', + 'title': 'Magic'}], + }] + assert works == expect + + + books = [ + {'title': 'Magic', 'key': '/books/OL1M'}, + {'title': 'Magic', 'key': '/books/OL2M'}, + ] + book_iter = get_books('', books, do_get_mc=False) + books2 = list(book_iter) + + var = find_works2(books2) + assert var['equiv'] == {} + assert var['norm_titles'] == {'magic': 2} + assert var['books_by_key'] == {'/books/OL1M': books2[0], '/books/OL2M': books2[1]} + assert var['books'] == books2 + assert var['rev_wt'] == {} + + works = list(find_works(books2, do_get_mc=False)) + expect = [ + { 'title': 'Magic', + 
'editions': [ + { 'key': '/books/OL1M', 'norm_title': 'magic', 'title': 'Magic'}, + { 'key': '/books/OL2M', 'norm_title': 'magic', 'title': 'Magic'}, + ], + }] + assert works == expect + + magico = u'm\xe1gico' + + assert normalize(magico) == magico + + books = [ + {'title': magico, 'work_title': ['magic'], 'key': '/books/OL1M'}, + {'title': 'magic', 'key': '/books/OL2M'}, + {'title': magico, 'work_title': ['magic'], 'key': '/books/OL3M'}, + {'title': 'magic', 'key': '/books/OL4M'}, + ] + expect_keys = sorted(e['key'] for e in books) + book_iter = get_books('', books, do_get_mc=False) + books2 = list(book_iter) + + expect = [ + {'key': '/books/OL1M', 'norm_title': magico, 'work_title': 'magic', 'norm_wt': 'magic', 'title': magico}, + {'key': '/books/OL2M', 'norm_title': 'magic', 'title': 'magic'}, + {'key': '/books/OL3M', 'norm_title': magico, 'work_title': 'magic', 'norm_wt': 'magic', 'title': magico}, + {'key': '/books/OL4M', 'norm_title': 'magic', 'title': 'magic'}, + ] + + assert len(books2) == 4 + for i in range(4): + assert books2[i] == expect[i] + + var = find_works2(books2) + assert var['equiv'] == {(magico, 'magic'): 2} + assert var['norm_titles'] == {magico: 2, 'magic': 2} + assert len(var['books_by_key']) == 4 + bk = var['books_by_key'] + assert bk['/books/OL1M'] == books2[0] + assert bk['/books/OL2M'] == books2[1] + assert bk['/books/OL3M'] == books2[2] + assert bk['/books/OL4M'] == books2[3] + assert var['books'] == books2 + assert var['rev_wt'] == {'magic': {'magic': 2}} + + title_map = build_work_title_map(var['equiv'], var['norm_titles']) + + assert title_map == {magico: 'magic'} + + find_works3(var) + assert var['works'] == {'magic': {'magic': expect_keys}} + assert var['work_titles'] == {'magic': ['/books/OL1M', '/books/OL3M']} + + sorted_works = find_work_sort(var) + assert sorted_works == [(6, 'magic', {'magic': expect_keys})] + + works = list(find_works(books2, do_get_mc=False)) + expect = [{ + 'title': u'Magic', + 'editions': [ + {'key': '/books/OL2M', 'norm_title': 'magic', 'title': 'magic'}, + {'key': '/books/OL1M', 'norm_title': u'mágico', 'norm_wt': 'magic', 'title': u'Mágico'}, + ], + }] + + work_count = len(works) + assert work_count == 1 + editions = works[0]['editions'] + edition_count = len(works[0]['editions']) + edition_keys = sorted(e['key'] for e in editions) + assert edition_keys == expect_keys + assert edition_count == 4 + del works[0]['editions'] + assert works[0] == {'title': 'magic'} + #assert works == expect + + diff --git a/ia-legacy-importer/works/tests.py b/ia-legacy-importer/works/tests.py new file mode 100644 index 00000000..059afa7b --- /dev/null +++ b/ia-legacy-importer/works/tests.py @@ -0,0 +1,143 @@ +from __future__ import print_function +from collections import defaultdict +import re +import catalog.merge.normalize as merge + +def freq_dict_top(d): + return sorted(d.keys(), reverse=True, key=lambda i:d[i])[0] + +re_brackets = re.compile('^(.*)\[.*?\]$') +re_parens = re.compile('^(.*?)(?: \(.+ (?:Edition|Press)\))+$') + +def mk_norm(title): + m = re_brackets.match(title) + if m: + title = m.group(1) + norm = merge.normalize(title).strip(' ') + norm = norm.replace(' and ', ' ') + if norm.startswith('the '): + norm = norm[4:] + elif norm.startswith('a '): + norm = norm[2:] + return norm.replace('-', '').replace(' ', '') + +def build_work_title_map(equiv, norm_titles): + title_to_work_title = defaultdict(set) + for (norm_title, norm_wt), v in equiv.items(): + if v != 1: + title_to_work_title[norm_title].add(norm_wt) + + title_map = {} + for 
title, v in title_to_work_title.items(): + if len(v) == 1: + title_map[title] = list(v)[0] + continue + most_common_title = max(v, key=lambda i:norm_titles[i]) + if title != most_common_title: + title_map[title] = most_common_title + for i in v: + if i != most_common_title: + title_map[i] = most_common_title + return title_map + + +milo_m_hastings = [ + {'lang': ['eng'], 'key': '/b/OL7009753M', 'title': 'The dollar hen'}, + {'lang': ['eng'], 'key': '/b/OL9563276M', 'title': 'The Dollar Hen (Large Print Edition)'}, + {'lang': ['eng'], 'key': '/b/OL9636071M', 'title': 'The Dollar Hen'}, + {'lang': ['eng'], 'key': '/b/OL15083244M', 'title': 'The dollar hen'}, + {'lang': ['eng'], 'key': '/b/OL8566971M', 'title': 'The Dollar Hen'}, + {'lang': ['eng'], 'key': '/b/OL9353753M', 'title': 'City of Endless Night'}, + {'lang': ['eng'], 'key': '/b/OL9462083M', 'title': 'City of Endless Night (Large Print Edition)'}, + {'lang': ['eng'], 'key': '/b/OL9642528M', 'title': 'The Dollar Hen'}, + {'lang': ['eng'], 'key': '/b/OL9736536M', 'title': 'The Dollar Hen'}, + {'lang': ['eng'], 'key': '/b/OL9735362M', 'title': 'The Dollar Hen (Illustrated Edition) (Dodo Press)'}, + {'lang': ['eng'], 'key': '/b/OL9800490M', 'title': 'The Dollar Hen'}, + {'lang': ['eng'], 'key': '/b/OL11676559M', 'title': 'City of Endless Night (Dodo Press)'}, + {'lang': ['eng'], 'key': '/b/OL11752220M', 'title': 'The Dollar Hen'}, + {'lang': ['eng'], 'key': '/b/OL11985500M', 'title': 'The Dollar Hen'}, + {'lang': ['eng'], 'key': '/b/OL11985503M', 'title': 'The Dollar Hen'} +] + +aaron_bancroft = [ # /a/OL17005A + {'lang': ['eng'], 'key': '/b/OL595471M', 'title': 'A sermon preached before His Excellency Caleb Strong, Esq., Governour, the Honourable the Council, Senate, and House of Representatives of the commonwealth of Massachusetts, May 27, 1801'}, + {'lang': ['eng'], 'key': '/b/OL1247387M', 'title': 'A discourse delivered before the convention of Congregational ministers of Massachusetts, at their annual meeting in Boston, June 1, 1820'}, + {'lang': ['eng'], 'key': '/b/OL6472976M', 'title': 'The importance of a religious education illustrated and enforced'}, + {'lang': ['eng'], 'key': '/b/OL6919451M', 'title': 'A discourse delivered at Windsor, in the state of Vermont, on the 23rd of June, MDCCXC'}, + {'lang': ['eng'], 'key': '/b/OL6950265M', 'title': 'A sermon delivered in Worcester, January 31, 1836'}, + {'key': '/b/OL7048038M', 'title': 'Sermons on those doctrines of the gospel, and on those constituent principles of the church, which Christian professors have made the subject of controversy. ..'}, + {'key': '/b/OL7197334M', 'title': 'The life of George Washington ....'}, + {'lang': ['eng'], 'key': '/b/OL14572992M', 'title': 'A sermon, delivered at Worcester, on the eleventh of June, 1793'}, + {'lang': ['eng'], 'key': '/b/OL14588026M', 'title': 'An eulogy on the character of the late Gen. 
George Washington.'}, + {'lang': ['eng'], 'key': '/b/OL14601446M', 'title': 'A sermon, delivered at Brimfield, on the 20th of June, 1798'}, + {'lang': ['eng'], 'key': '/b/OL14608347M', 'title': 'The importance of a religious education illustrated and enforced.'}, + {'lang': ['eng'], 'key': '/b/OL14702050M', 'title': 'The nature and worth of Christian liberty'}, + {'lang': ['eng'], 'key': '/b/OL14981988M', 'title': 'A vindication of the result of the late Mutual Council convened in Princeton'}, + {'lang': ['eng'], 'key': '/b/OL14992328M', 'title': 'An essay on the life of George Washington'}, + {'lang': ['eng'], 'key': '/b/OL15054440M', 'title': 'Importance of education'}, + {'lang': ['eng'], 'key': '/b/OL15070888M', 'title': 'The leaf an emblem of human life'}, + {'lang': ['eng'], 'key': '/b/OL15075529M', 'title': 'The world passeth away, but the children of God abide forever'}, + {'lang': ['eng'], 'key': '/b/OL15085786M', 'title': 'The doctrine of immortality'}, + {'lang': ['eng'], 'key': '/b/OL15093560M', 'title': 'The comparative advantages of the ministerial profession'}, + {'lang': ['eng'], 'key': '/b/OL15115706M', 'title': 'The duties enjoined by the Fourth commandment'}, + {'lang': ['eng'], 'key': '/b/OL15120201M', 'title': 'A discourse on conversion'}, + {'lang': ['eng'], 'key': '/b/OL15120290M', 'title': 'The nature and worth of Christian liberty'}, + {'lang': ['eng'], 'key': '/b/OL17052663M', 'title': 'An eulogy on the character of the late Gen. George Washington'}, + {'lang': ['eng'], 'key': '/b/OL17704747M', 'title': 'The doctrine of immortality'}, + {'lang': ['eng'], 'key': '/b/OL17707429M', 'title': 'Importance of education'}, + {'lang': ['eng'], 'key': '/b/OL17709244M', 'title': 'A vindication of the result of the late mutual council convened in Princeton'}, + {'lang': ['eng'], 'key': '/b/OL18776110M', 'title': 'Sermons on those doctrines of the gospel, and on those constituent principles of the church, which Christian professors have made the subject of controversy'}, + {'lang': ['eng'], 'key': '/b/OL6573411M', 'title': 'The life of George Washington, commander in chief of the American army, through the revolutionary war'}, + {'lang': ['eng'], 'key': '/b/OL15592993M', 'title': 'A discourse on conversion'}, + {'lang': ['eng'], 'key': '/b/OL17712475M', 'title': 'A discourse on conversion'}, + {'lang': ['eng'], 'key': '/b/OL6290214M', 'title': 'The life of George Washington'}, + {'lang': ['eng'], 'key': '/b/OL6571503M', 'title': 'The life of George Washington'}, + {'lang': ['eng'], 'key': '/b/OL6573412M', 'title': 'Life of George Washington'}, + {'work_title': 'Essay on the life of George Washington', 'key': '/b/OL7168113M', 'title': 'Life of George Washington, commander in chief of the American army through the revolutionary war, and the first president of the United States.'}, + {'work_title': 'Essay on the life of George Washington', 'key': '/b/OL7243025M', 'title': 'The life of George Washington, commander in chief of the American army, through the revolutionary war, and the first president of the United States'}, + {'lang': ['eng'], 'key': '/b/OL28289M', 'title': 'The life of George Washington, commander-in-chief of the American Army through the Revolutionary War and the first President of the United States'}, + {'lang': ['eng'], 'key': '/b/OL6354818M', 'title': 'The life of George Washington, commander-in-chief of the American Army through the revolutionary war, and the first president of the United States.'}, + {'key': '/b/OL7113589M', 'title': 'The life of George 
Washington, Commander-in-Chief of the American Army, through the Revolutionary War; and the first President of the United States.'} +] + +def find_works(books): + for book in books: + m = re_parens.match(book['title']) + if m: + book['title'] = m.group(1) + n = mk_norm(book['title']) + book['norm_title'] = n + + books_by_key = dict((b['key'], b) for b in books) + norm_titles = defaultdict(int) + + for book in books: + norm_titles[book['norm_title']] += 1 + + title_map = build_work_title_map({}, norm_titles) + + works = defaultdict(lambda: defaultdict(list)) + work_titles = defaultdict(list) + for b in books: + if 'eng' not in b.get('lang', []) and 'norm_wt' in b: + work_titles[b['norm_wt']].append(b['key']) + continue + n = b['norm_title'] + title = b['title'] + if n in title_map: + n = title_map[n] + title = freq_dict_top(rev_wt[n]) + works[n][title].append(b['key']) + + #for k, v in works.items(): + # print k + # print ' ', sum(len(i) for i in v.values()), dict(v) + #print + + works = sorted([(sum(map(len, w.values() + [work_titles[n]])), n, w) for n, w in works.items()]) + + for a, b, c in works: + print(a, b, dict(c)) + +find_works(milo_m_hastings) +find_works(aaron_bancroft) diff --git a/ia-legacy-importer/works/use_amazon.py b/ia-legacy-importer/works/use_amazon.py new file mode 100755 index 00000000..dee37cf4 --- /dev/null +++ b/ia-legacy-importer/works/use_amazon.py @@ -0,0 +1,78 @@ +from __future__ import print_function +import os +import re +import sys +import codecs +import dbhash +from catalog.amazon.other_editions import find_others +from catalog.infostore import get_site +from catalog.read_rc import read_rc +from catalog.get_ia import get_data +from catalog.marc.build_record import build_record +from catalog.marc.fast_parse import get_tag_lines, get_all_subfields + +sys.stdout = codecs.getwriter('utf-8')(sys.stdout) +rc = read_rc() +db = dbhash.open(rc['index_path'] + 'isbn_to_marc.dbm', 'r') + +site = get_site() + +def get_records_from_marc(isbn): + if isbn not in db: + return +# for loc in db[isbn].split(' '): +# data = get_data(loc) +# print loc +# want = ['100', '110', '111', '240', '245', '260'] + [str(i) for i in range(500,600) if i not in (505, 520)] +# for tag, line in get_tag_lines(data, set(want)): +# sub = list(get_all_subfields(line)) +# if tag.startswith('5'): +# assert len(sub) == 1 and sub[0][0] == 'a' +# note = sub[0][1] +# if note.find('ublish') != -1 or note.find('riginal') != -1: +# print ' note:', note +# continue +# print ' ', tag, sub +# print + recs = [(loc, build_record(get_data(loc))) for loc in db[isbn].split(' ')] + keys = set() + print() + for loc, rec in recs: + print(' ', loc) +# keys.update([k for k in rec.keys() if k.find('title') != -1 or k in ('authors', 'title', 'contributions', 'work_title')]) + keys.update(rec.keys()) + print() + for k in keys: + print(k) + for loc, rec in recs: + print(" ", rec.get(k, '###')) + print() + print() + +dir = sys.argv[1] +for filename in os.listdir(dir): + if not filename[0].isdigit(): + continue + l = find_others(filename, dir) + if not l: + continue + print(filename) + for k in site.things({'isbn_10': filename, 'type': '/type/edition'}): + t = site.withKey(k) + num = len(t.isbn_10) + if num == 1: + num = '' + print(' OL:', k, t.title, num) + get_records_from_marc(filename) + for asin, extra in l: + print(asin, extra) + things = site.things({'isbn_10': asin, 'type': '/type/edition'}) + if things: + for k in things: + t = site.withKey(k) + num = len(t.isbn_10) + if num == 1: + num = '' + print(' OL:', k, 
t.title, num)
+        get_records_from_marc(asin)
+    print("----")
diff --git a/ia-legacy-importer/works/use_amazon2.py b/ia-legacy-importer/works/use_amazon2.py
new file mode 100755
index 00000000..369b0176
--- /dev/null
+++ b/ia-legacy-importer/works/use_amazon2.py
@@ -0,0 +1,27 @@
+from __future__ import print_function
+import os
+import re
+import sys
+import codecs
+import dbhash
+from catalog.amazon.other_editions import find_others
+from catalog.infostore import get_site
+from catalog.read_rc import read_rc
+from catalog.get_ia import get_data
+from catalog.marc.build_record import build_record
+from catalog.marc.fast_parse import get_tag_lines, get_all_subfields
+
+sys.stdout = codecs.getwriter('utf-8')(sys.stdout)
+rc = read_rc()
+db = dbhash.open(rc['index_path'] + 'isbn_to_marc.dbm', 'r')
+
+site = get_site()
+
+dir = sys.argv[1]
+for filename in os.listdir(dir):
+    if not filename[0].isdigit():
+        continue
+    l = find_others(filename, dir)
+    if len(l) < 8:
+        continue
+    print(filename, len(l))
diff --git a/ia-legacy-importer/works/web_ui.py b/ia-legacy-importer/works/web_ui.py
new file mode 100644
index 00000000..10227b48
--- /dev/null
+++ b/ia-legacy-importer/works/web_ui.py
@@ -0,0 +1,178 @@
+from __future__ import print_function
+import web
+import re
+from time import time
+from catalog.read_rc import read_rc
+from catalog.infostore import get_site
+#from catalog.db_read import get_things, withKey
+from catalog.amazon.other_editions import find_others
+from catalog.merge.normalize import normalize
+
+rc = read_rc()
+
+re_translation_of = re.compile(r'^Translation of\b[: ]*([^\n]*?)\.?$', re.I | re.M)
+
+site = get_site()
+
+def isbn_link(i):
+    # ISBN linked on Open Library, with an Amazon product page link in parentheses
+    return '<a href="http://openlibrary.org/isbn/%s">%s</a> (<a href="http://www.amazon.com/dp/%s">Amazon.com</a>)' % (i, i, i)
+
+def ol_link(key):
+    return '<a href="http://openlibrary.org%s">%s</a>' % (key, key)
+
+def get_author_keys(name):
+    authors = site.things({ 'type': '/type/author', 'name': name })
+    if authors:
+        return ','.join("'%s'" % a for a in authors)
+    else:
+        return None
+
+def get_title_to_key(author):
+    # get id to key mapping of all editions by author
+    author_keys = get_author_keys(author)
+    if not author_keys:
+        return {}
+
+    # get title to key mapping of all editions by author
+    t0 = time()
+    sql = "select key, value as title from thing, edition_str " \
+        + "where thing.id = thing_id and key_id=3 and thing_id in (" \
+        + "select thing_id from edition_ref, thing " \
+        + "where edition_ref.key_id=11 and edition_ref.value = thing.id and thing.key in (" + author_keys + "))"
+    print(sql)
+    return {}
+    title_to_key = {}
+    for r in web.query(sql):
+        t = normalize(r.title).strip('.')
+        title_to_key.setdefault(t, []).append(r.key)
+    return title_to_key
+
+def search(title, author):
+
+    title_to_key = get_title_to_key(author)
+    norm_title = normalize(title).strip('.')
+
+    if norm_title not in title_to_key:
+        print('title not found')
+        return
+
+    pool = set(title_to_key[norm_title])
+
+    editions = []
+    seen = set()
+    found_titles = {}
+    found_isbn = {}
+    while pool:
+        key = pool.pop()
+        seen.add(key)
+        e = site.withKey(key)
+        translation_of = None
+        if False and e.notes:
+            m = re_translation_of.search(e.notes)
+            if m:
+                translation_of = m.group(1).lower()
+                pool.update(k for k in title_to_key[translation_of] if k not in seen)
+                found_titles.setdefault(translation_of, []).append(key)
+        if False and e.isbn_10:
+            for i in e.isbn_10:
+                found_isbn.setdefault(i, []).append(key)
+            join_isbn = ', '.join(map(isbn_link, e.isbn_10))
+        else:
+            join_isbn = ''
+        rec = {
+            'key': key,
+            'publish_date': e.publish_date,
+            'publishers': ', '.join(p.encode('utf-8') for p in (e.publishers or [])),
+            'isbn': join_isbn,
+        }
+        editions.append(rec)
+
+        if e.work_titles:
+            for t in e.work_titles:
+                t = t.strip('.')
+                pool.update(k for k in title_to_key.get(t.lower(), []) if k not in seen)
+                found_titles.setdefault(t, []).append(key)
+        if e.other_titles:
+            for t in e.other_titles:
+                t = t.strip('.')
+                pool.update(k for k in title_to_key.get(t.lower(), []) if k not in seen)
+                found_titles.setdefault(t, []).append(key)
+
+    print('<table>')
+    for e in sorted(editions, key=lambda e: e['publish_date'] and e['publish_date'][-4:]):
+        print('<tr>')
+        print('<td>', ol_link(e['key']), '</td>')
+        print('<td>', e['publish_date'], '</td><td>', e['publishers'], '</td><td>', e['isbn'], '</td>')
+        print('</tr>')
+    print('</table>')
+
+    if found_titles:
+        print('<h2>Other titles</h2>')
+        print('<ul>')
+        for k, v in found_titles.iteritems():
+            if k == title:
+                continue
+            print('<li><a href="?title=%s&author=%s">%s</a>' % (k, author, k), end=' ')
+            print('from', ', '.join(ol_link(i) for i in v))
+        print('</ul>')
+
+    extra_isbn = {}
+    for k, v in found_isbn.iteritems():
+        for isbn, note in find_others(k, rc['amazon_other_editions']):
+            if note.lower().find('audio') != -1:
+                continue
+            if isbn not in found_isbn:
+                extra_isbn.setdefault(isbn, []).extend(v)
+
+    if extra_isbn:
+        print('<h2>Other ISBN</h2>')
+        print('<ul>')
+        for k in sorted(extra_isbn):
+            print('<li>', isbn_link(k), end=' ')
+            print('from', ', '.join(ol_link(i) for i in extra_isbn[k]))
+        print('</ul>')
+
+urls = (
+    '/', 'index'
+)
+
+def textbox(name, input):
+    if name in input:
+        return '<input type="text" name="%s" value="%s">' % (name, web.htmlquote(input[name]))
+    else:
+        return '<input type="text" name="%s">' % (name)
+
+class index:
+    def GET(self):
+        web.header('Content-Type','text/html; charset=utf-8', unique=True)
+        input = web.input()
+        title = None
+        author = None
+        if 'title' in input:
+            title = input.title
+        if 'author' in input:
+            author = input.author
+        html_title = 'Work finder'
+        print("<html>\n<head>\n<title>%s</title>" % html_title)
+        print('</head>')
+        print('<body>')
+        print('<form method="get">')
+        print('<table>')
+        print('<tr><td>Title</td><td>', textbox('title', input), '</td></tr>')
+        print('<tr><td>Author</td><td>', textbox('author', input), '</td></tr>')
+        print('</table>')
+        print('<input type="submit" value="search">')
+        print('</form>')
+        if title and author:
+            search(title, author)
+        print('</body>\n</html>')
+
+if __name__ == "__main__": web.run(urls, globals(), web.reloader)