<html xmlns:v="urn:schemas-microsoft-com:vml" xmlns:o="urn:schemas-microsoft-com:office:office" xmlns:w="urn:schemas-microsoft-com:office:word" xmlns:m="http://schemas.microsoft.com/office/2004/12/omml" xmlns="http://www.w3.org/TR/REC-html40">
<head>
<meta http-equiv="Content-Type" content="text/html; charset=utf-8">
<meta name="Generator" content="Microsoft Word 15 (filtered medium)">
<style><!--
/* Font Definitions */
@font-face
        {font-family:Wingdings;
        panose-1:5 0 0 0 0 0 0 0 0 0;}
@font-face
        {font-family:"Cambria Math";
        panose-1:2 4 5 3 5 4 6 3 2 4;}
@font-face
        {font-family:Calibri;
        panose-1:2 15 5 2 2 2 4 3 2 4;}
/* Style Definitions */
p.MsoNormal, li.MsoNormal, div.MsoNormal
        {margin:0in;
        margin-bottom:.0001pt;
        font-size:11.0pt;
        font-family:"Calibri",sans-serif;}
a:link, span.MsoHyperlink
        {mso-style-priority:99;
        color:#0563C1;
        text-decoration:underline;}
a:visited, span.MsoHyperlinkFollowed
        {mso-style-priority:99;
        color:#954F72;
        text-decoration:underline;}
p.MsoListParagraph, li.MsoListParagraph, div.MsoListParagraph
        {mso-style-priority:34;
        margin-top:0in;
        margin-right:0in;
        margin-bottom:0in;
        margin-left:.5in;
        margin-bottom:.0001pt;
        font-size:11.0pt;
        font-family:"Calibri",sans-serif;}
p.msonormal0, li.msonormal0, div.msonormal0
        {mso-style-name:msonormal;
        mso-margin-top-alt:auto;
        margin-right:0in;
        mso-margin-bottom-alt:auto;
        margin-left:0in;
        font-size:11.0pt;
        font-family:"Calibri",sans-serif;}
span.EmailStyle18
        {mso-style-type:personal;
        font-family:"Calibri",sans-serif;
        color:windowtext;}
span.EmailStyle19
        {mso-style-type:personal-reply;
        font-family:"Calibri",sans-serif;
        color:windowtext;}
.MsoChpDefault
        {mso-style-type:export-only;
        font-size:10.0pt;}
@page WordSection1
        {size:8.5in 11.0in;
        margin:1.0in 1.0in 1.0in 1.0in;}
div.WordSection1
        {page:WordSection1;}
/* List Definitions */
@list l0
        {mso-list-id:1561944021;
        mso-list-type:hybrid;
        mso-list-template-ids:-1919241760 67698703 67698713 67698715 67698703 67698713 67698715 67698703 67698713 67698715;}
@list l0:level1
        {mso-level-tab-stop:none;
        mso-level-number-position:left;
        text-indent:-.25in;}
@list l0:level2
        {mso-level-number-format:alpha-lower;
        mso-level-tab-stop:none;
        mso-level-number-position:left;
        text-indent:-.25in;}
@list l0:level3
        {mso-level-number-format:roman-lower;
        mso-level-tab-stop:none;
        mso-level-number-position:right;
        text-indent:-9.0pt;}
@list l0:level4
        {mso-level-tab-stop:none;
        mso-level-number-position:left;
        text-indent:-.25in;}
@list l0:level5
        {mso-level-number-format:alpha-lower;
        mso-level-tab-stop:none;
        mso-level-number-position:left;
        text-indent:-.25in;}
@list l0:level6
        {mso-level-number-format:roman-lower;
        mso-level-tab-stop:none;
        mso-level-number-position:right;
        text-indent:-9.0pt;}
@list l0:level7
        {mso-level-tab-stop:none;
        mso-level-number-position:left;
        text-indent:-.25in;}
@list l0:level8
        {mso-level-number-format:alpha-lower;
        mso-level-tab-stop:none;
        mso-level-number-position:left;
        text-indent:-.25in;}
@list l0:level9
        {mso-level-number-format:roman-lower;
        mso-level-tab-stop:none;
        mso-level-number-position:right;
        text-indent:-9.0pt;}
@list l1
        {mso-list-id:1689136040;
        mso-list-type:hybrid;
        mso-list-template-ids:675705410 67698689 67698691 67698693 67698689 67698691 67698693 67698689 67698691 67698693;}
@list l1:level1
        {mso-level-number-format:bullet;
        mso-level-text:\F0B7;
        mso-level-tab-stop:none;
        mso-level-number-position:left;
        text-indent:-.25in;
        font-family:Symbol;}
@list l1:level2
        {mso-level-number-format:bullet;
        mso-level-text:o;
        mso-level-tab-stop:none;
        mso-level-number-position:left;
        text-indent:-.25in;
        font-family:"Courier New";}
@list l1:level3
        {mso-level-number-format:bullet;
        mso-level-text:\F0A7;
        mso-level-tab-stop:none;
        mso-level-number-position:left;
        text-indent:-.25in;
        font-family:Wingdings;}
@list l1:level4
        {mso-level-number-format:bullet;
        mso-level-text:\F0B7;
        mso-level-tab-stop:none;
        mso-level-number-position:left;
        text-indent:-.25in;
        font-family:Symbol;}
@list l1:level5
        {mso-level-number-format:bullet;
        mso-level-text:o;
        mso-level-tab-stop:none;
        mso-level-number-position:left;
        text-indent:-.25in;
        font-family:"Courier New";}
@list l1:level6
        {mso-level-number-format:bullet;
        mso-level-text:\F0A7;
        mso-level-tab-stop:none;
        mso-level-number-position:left;
        text-indent:-.25in;
        font-family:Wingdings;}
@list l1:level7
        {mso-level-number-format:bullet;
        mso-level-text:\F0B7;
        mso-level-tab-stop:none;
        mso-level-number-position:left;
        text-indent:-.25in;
        font-family:Symbol;}
@list l1:level8
        {mso-level-number-format:bullet;
        mso-level-text:o;
        mso-level-tab-stop:none;
        mso-level-number-position:left;
        text-indent:-.25in;
        font-family:"Courier New";}
@list l1:level9
        {mso-level-number-format:bullet;
        mso-level-text:\F0A7;
        mso-level-tab-stop:none;
        mso-level-number-position:left;
        text-indent:-.25in;
        font-family:Wingdings;}
ol
        {margin-bottom:0in;}
ul
        {margin-bottom:0in;}
--></style><!--[if gte mso 9]><xml>
<o:shapedefaults v:ext="edit" spidmax="1026" />
</xml><![endif]--><!--[if gte mso 9]><xml>
<o:shapelayout v:ext="edit">
<o:idmap v:ext="edit" data="1" />
</o:shapelayout></xml><![endif]-->
</head>
<body lang="EN-US" link="#0563C1" vlink="#954F72">
<div class="WordSection1">
<p class="MsoNormal">John,<o:p></o:p></p>
<p class="MsoNormal"><o:p> </o:p></p>
<p class="MsoNormal">What I think that you’d want to do in this case is to modify the EAD so that it looks like the following:<o:p></o:p></p>
<p class="MsoNormal"><o:p> </o:p></p>
<p class="MsoNormal"><span style="font-size:12.0pt;font-family:&quot;Arial&quot;,sans-serif;color:#000096;background:white;mso-highlight:white">&lt;physdesc</span><span style="font-size:12.0pt;font-family:&quot;Arial&quot;,sans-serif;color:#F5844C;background:white;mso-highlight:white">
 label</span><span style="font-size:12.0pt;font-family:&quot;Arial&quot;,sans-serif;color:#FF8040;background:white;mso-highlight:white">=</span><span style="font-size:12.0pt;font-family:&quot;Arial&quot;,sans-serif;color:#993300;background:white;mso-highlight:white">"Extent:"</span><span style="font-size:12.0pt;font-family:&quot;Arial&quot;,sans-serif;color:#F5844C;background:white;mso-highlight:white">
 encodinganalog</span><span style="font-size:12.0pt;font-family:&quot;Arial&quot;,sans-serif;color:#FF8040;background:white;mso-highlight:white">=</span><span style="font-size:12.0pt;font-family:&quot;Arial&quot;,sans-serif;color:#993300;background:white;mso-highlight:white">"300"</span><span style="font-size:12.0pt;font-family:&quot;Arial&quot;,sans-serif;color:#000096;background:white;mso-highlight:white">&gt;<o:p></o:p></span></p>
<p class="MsoNormal" style="text-indent:.5in"><span style="font-size:12.0pt;font-family:&quot;Arial&quot;,sans-serif;color:#000096;background:white;mso-highlight:white">&lt;extent&gt;</span><span style="font-size:12.0pt;font-family:&quot;Arial&quot;,sans-serif;color:black;background:white;mso-highlight:white">15.0
 linear_feet</span><span style="font-size:12.0pt;font-family:&quot;Arial&quot;,sans-serif;color:#000096;background:white;mso-highlight:white">&lt;/extent&gt;</span><span style="font-size:12.0pt;font-family:&quot;Arial&quot;,sans-serif;color:black;background:white;mso-highlight:white"><o:p></o:p></span></p>
<p class="MsoNormal" style="text-indent:.5in"><span style="font-size:12.0pt;font-family:&quot;Arial&quot;,sans-serif;color:#000096;background:white;mso-highlight:white">&lt;extent&gt;</span><span style="font-size:12.0pt;font-family:&quot;Arial&quot;,sans-serif;color:black;background:white;mso-highlight:white">(36
 boxes + oversize folder)</span><span style="font-size:12.0pt;font-family:&quot;Arial&quot;,sans-serif;color:#000096;background:white;mso-highlight:white">&lt;/extent&gt;</span><span style="font-size:12.0pt;font-family:&quot;Arial&quot;,sans-serif;color:black;background:white;mso-highlight:white"><o:p></o:p></span></p>
<p class="MsoNormal"><span style="font-size:12.0pt;font-family:&quot;Arial&quot;,sans-serif;color:#000096;background:white;mso-highlight:white">&lt;/physdesc&gt;</span><o:p></o:p></p>
<p class="MsoNormal"><o:p> </o:p></p>
<p class="MsoNormal">Two important points about this:<o:p></o:p></p>
<p class="MsoNormal"><o:p> </o:p></p>
<ol style="margin-top:0in" start="1" type="1">
<li class="MsoListParagraph" style="margin-left:0in;mso-list:l0 level1 lfo2">The ASpace EAD importer uses the database values for controlled value fields, which is why I’ve changed linear feet to “linear_feet”  (“linear_feet” is one of the database values available
 in ASpace by default, but if that’s not the value that matches your YML translation, you might want to use another one).  The ASpace EAD exporter, on the other hand, will use the YML translation when exporting the EAD, so you’d wind up with “linear feet” in
 the export, or whatever else is specified in the YML file that’s being employed by your application.<o:p></o:p></li><li class="MsoListParagraph" style="margin-left:0in;mso-list:l0 level1 lfo2">Whatever you put into a second extent statement will be mapped to the Container Summary field in ArchivesSpace.<o:p></o:p></li></ol>
<p class="MsoNormal"><o:p> </o:p></p>
<p class="MsoNormal">This is essentially following the AT model for importing EAD physdesc elements.  I wish, instead, that ASpace would only add extent values based on the availability of the extent/@unit attribute in EAD 2002.   That would make things a lot
 less dicey than trying to  parse the text field of an extent element during import time, but it would require more EAD manipulation for a lot of folks before importing that data since the @unit attribute isn’t heavily used.<o:p></o:p></p>
<p class="MsoNormal"><o:p> </o:p></p>
<p class="MsoNormal">Mark<o:p></o:p></p>
<p class="MsoNormal"><o:p> </o:p></p>
<p class="MsoNormal">p.s.   the physdesc/@label attribute, however, does NOT get mapped at all by ASpace.  Instead, it’s dropped silently during the import process.  That used to be the case, at least.  I haven’t checked in a while to see if that behavior has
 been changed, but in general label attributes and head elements will usually map to the ASpace label field.<o:p></o:p></p>
<p class="MsoNormal"><o:p> </o:p></p>
<p class="MsoNormal">p.p.s. I’ve never tested to see what happens if you have a third sibling extent statement (to see if those get dropped or appended to container summary).  But I have tested using dimensions and/or physfacet within the same grouping, and
 those are imported as expected.<o:p></o:p></p>
<p class="MsoNormal"><o:p> </o:p></p>
<p class="MsoNormal"><o:p> </o:p></p>
<p class="MsoNormal"><o:p> </o:p></p>
<p class="MsoNormal"><o:p> </o:p></p>
<div>
<div style="border:none;border-top:solid #E1E1E1 1.0pt;padding:3.0pt 0in 0in 0in">
<p class="MsoNormal"><b>From:</b> archivesspace_users_group-bounces@lyralists.lyrasis.org [mailto:archivesspace_users_group-bounces@lyralists.lyrasis.org]
<b>On Behalf Of </b>Rees, John (NIH/NLM) [E]<br>
<b>Sent:</b> Thursday, 21 June, 2018 3:43 PM<br>
<b>To:</b> Archivesspace Users Group &lt;archivesspace_users_group@lyralists.lyrasis.org&gt;<br>
<b>Subject:</b> [Archivesspace_Users_Group] EAD import extents mapping<o:p></o:p></p>
</div>
</div>
<p class="MsoNormal"><o:p> </o:p></p>
<p class="MsoNormal" style="background:white;text-autospace:none"><span style="font-size:12.0pt;font-family:&quot;Arial&quot;,sans-serif">Using the background job importer, I’m trying to import extent data from EAD 2002 schema XML, specifically the other extent data
 we record in parentheses like <span style="color:#000096;background:white;mso-highlight:white">
&lt;physdesc</span><span style="color:#F5844C;background:white;mso-highlight:white"> label</span><span style="color:#FF8040;background:white;mso-highlight:white">=</span><span style="color:#993300;background:white;mso-highlight:white">"Extent:"</span><span style="color:#F5844C;background:white;mso-highlight:white">
 encodinganalog</span><span style="color:#FF8040;background:white;mso-highlight:white">=</span><span style="color:#993300;background:white;mso-highlight:white">"300"</span><span style="color:#000096;background:white;mso-highlight:white">&gt;</span><span style="color:black;background:white;mso-highlight:white">
</span><span style="color:#000096;background:white;mso-highlight:white">&lt;extent&gt;</span><span style="color:black;background:white;mso-highlight:white">15.0 linear feet (36 boxes + oversize folder)</span><span style="color:#000096;background:white;mso-highlight:white">&lt;/extent&gt;</span><span style="color:black;background:white;mso-highlight:white">
</span><span style="color:#000096;background:white;mso-highlight:white">&lt;/physdesc&gt;</span><span style="background:white;mso-highlight:white"><o:p></o:p></span></span></p>
<p class="MsoNormal"><span style="font-size:12.0pt;font-family:&quot;Arial&quot;,sans-serif"><o:p>&nbsp;</o:p></span></p>
<p class="MsoNormal"><span style="font-size:12.0pt;font-family:&quot;Arial&quot;,sans-serif">I’d like these parenthetical statements to map to the Container Summary field. According to the EAD import mapper
<a href="https://na01.safelinks.protection.outlook.com/?url=http%3A%2F%2Farchivesspace.org%2Fwp-content%2Fuploads%2F2016%2F05%2FEAD-Import-Export-Mapping-20171030.xlsx&amp;data=02%7C01%7Cmark.custer%40yale.edu%7C7fd7312237a74499772f08d5d7af3fb7%7Cdd8cbebb21394df8b4114e3e87abeb5c%7C0%7C1%7C636652070056478978&amp;sdata=pB8JYJlx5gpDPD8ugiqZReY2BLk60%2BkfTaOHex%2B0EEU%3D&amp;reserved=0">
http://archivesspace.org/wp-content/uploads/2016/05/EAD-Import-Export-Mapping-20171030.xlsx</a> anything after a number and space that can’t be parsed should import into Container Summary.<o:p></o:p></span></p>
<p class="MsoNormal"><span style="font-size:12.0pt;font-family:&quot;Arial&quot;,sans-serif"><o:p>&nbsp;</o:p></span></p>
<p class="MsoNormal"><span style="font-size:12.0pt;font-family:&quot;Arial&quot;,sans-serif">Is there a syntax for making this string unparsable and forcing this behavior? Currently “<span style="color:black;background:white;mso-highlight:white">linear feet (36 boxes +
 oversize folder)</span><span style="color:black">” from the above imports to Extent @Type as a new unique value and I don’t want all that data pollution.<o:p></o:p></span></span></p>
<p class="MsoNormal"><span style="font-size:12.0pt;font-family:&quot;Arial&quot;,sans-serif;color:black"><o:p>&nbsp;</o:p></span></p>
<p class="MsoNormal"><span style="font-size:12.0pt;font-family:&quot;Arial&quot;,sans-serif;color:black">Thanks,<o:p></o:p></span></p>
<p class="MsoNormal"><span style="font-size:12.0pt;font-family:&quot;Arial&quot;,sans-serif;color:black">John<o:p></o:p></span></p>
<p class="MsoNormal"><o:p> </o:p></p>
<p class="MsoNormal">John P. Rees<o:p></o:p></p>
<p class="MsoNormal">Archivist and Digital Resources Manager<o:p></o:p></p>
<p class="MsoNormal">History of Medicine Division<o:p></o:p></p>
<p class="MsoNormal">National Library of Medicine<o:p></o:p></p>
<p class="MsoNormal">301-827-4510<o:p></o:p></p>
<p class="MsoNormal"><o:p> </o:p></p>
<p class="MsoNormal"><span style="font-size:12.0pt;font-family:&quot;Arial&quot;,sans-serif"><o:p>&nbsp;</o:p></span></p>
</div>
</body>
</html>