<?xml version="1.0" encoding="UTF-8"?>
<TEI.2 id="poster_178_iacob">
   <teiHeader>
      <fileDesc>
         <titleStmt>
            <title>Edition Production Technology: an Eclipse-Based Platform for Building Image-Based Electronic Editions</title>
            <author>
               <name reg="Iacob, Ionut Emil">Ionut Emil Iacob</name>
            </author>
            <author>
               <name reg="Kiernan, Kevin">Kevin Kiernan</name>
            </author>
            <author>
               <name reg="Dekhtyar, Alex">Alex Dekhtyar</name>
            </author>
            <respStmt>
               <resp>Marked up by </resp>
               <name reg="Holmes, Martin">Martin Holmes</name>
               <lb/>
               <name reg="Baer, Patricia">Patricia Baer</name>
            </respStmt>
         </titleStmt>
         <publicationStmt>
            <p>Marked up to be included in the ACH/ALLC 2005 Conference Abstracts book.</p>
         </publicationStmt>
         <sourceDesc>
            <p>None</p>
         </sourceDesc>
      </fileDesc>
      <profileDesc>
         <textClass>
            <classCode>poster</classCode>
            <keywords>
               <list>
                  <item>image-based electronic editing</item>
                  <item>editing tools</item>
               </list>
            </keywords>
         </textClass>
      </profileDesc>
      <revisionDesc>
         <list>
            <item>MDH: Created from John Bradley's XML <date value="2005-03">March 2005</date>
            </item>
            <item>PAB: Marked up <date value="2005-04-12">12 April 2005</date>
            </item>
            <item>MDH: RS proofed and signed off without changes <date value="2005-05-18">18 May 2005</date>.</item>
         </list>
      </revisionDesc>
   </teiHeader>
   <text>
      <front>
         <docTitle n="Edition Production Technology: an Eclipse-Based Platform for Building Image-Based Electronic Editions">
            <titlePart>
               <title level="m">Edition Production Technology</title>: an <title level="m">Eclipse</title>-Based Platform for Building Image-Based Electronic Editions</titlePart>
         </docTitle>
         <docAuthor>
            <name reg="Iacob, Ionut Emil">Ionut Emil Iacob</name>
            <address>
               <addrLine>ionut@ms.uky.edu</addrLine>
            </address>
         </docAuthor>
         <titlePart type="affil">Department of Computer Science, University of Kentucky</titlePart>
         <docAuthor>
            <name reg="Kiernan, Kevin">Kevin Kiernan</name>
            <address>
               <addrLine>kiernan@uky.edu</addrLine>
            </address>
         </docAuthor>
         <titlePart type="affil">Department of English, University of Kentucky</titlePart>
         <docAuthor>
            <name reg="Dekhtyar, Alex">Alex Dekhtyar</name>
            <address>
               <addrLine>dekhtyar@cs.uky.edu</addrLine>
            </address>
         </docAuthor>
         <titlePart type="affil">Department of Computer Science, University of Kentucky</titlePart>
      </front>
      <body>
         <div0>
            <p>
We are developing the <title level="m">Edition Production Technology</title> (<title level="m">EPT</title>), an integrated development environment for building Image-based Electronic Editions (IBEE) (Kiernan 2005), through the <title level="m">Electronic Boethius</title> (Kiernan and Porter 2005) and <title>ARCHway Projects</title> (Kiernan et al. 2004; Kiernan et al. 2005) at the University of Kentucky. We built the EPT using <title level="m">Java</title>, and it operates through the <title level="m">Eclipse</title> platform, benefiting from <title level="m">Eclipse’s</title> open architecture and portability. Currently the <title level="m">EPT</title> runs on <title level="m">Windows XP</title>, <title level="m">Linux</title>, and <title level="m">Mac OS X</title>.
</p>
            <p>   
   The goal of the <title level="m">EPT</title> is to provide software support for building image-based electronic editions of cultural manuscripts. Starting with images and text, the <title level="m">EPT</title> enables the editor to create an electronic edition with complex, pervasive XML encodings, search the electronic edition, link text and images, and deploy the completed electronic edition using filters and XSLT. 
</p>
            <p>   
   A fully functional demo version of the <title level="m">EPT</title> software suite for PC, including sample projects, is available for download at <xptr to="http://rch01.rch.uky.edu/~ept/download"/>. 
</p>
            <p>
               <figure rend="ImageLink">
                  <head>Figure 1. A snapshot of <title level="m">EPT</title> illustrating image-based encoding through <title level="m">ImagText</title>, <title level="m">xMarkup</title>, and <title level="m">xTagger</title> (including an XML view). The figure also shows the Keyboard panel and Search Tool.</head>
                  <p>
                     <xref>poster_178_iacob_1.jpg</xref>
                  </p>
                  <figDesc>Figure 1. A snapshot of <title level="m">EPT</title> illustrating image-based encoding through <title level="m">ImagText</title>, <title level="m">xMarkup</title>, and <title level="m">xTagger</title> (including an XML view). The figure also shows the Keyboard panel and Search Tool.</figDesc>
               </figure>
            </p>
         </div0>
         <div0>
            <head>Editorial Tools on <title level="m">EPT</title> Platform</head>
            <p>
               <list type="unordered">
                  <item>Project wizard initializes an electronic edition project. The input data consists of image files, text content (or partially encoded text) and one or more DTDs (<title level="m">EPT</title> provides support for concurrent markup using multiple DTDs).</item>
                  <item>
                     <title level="m">xMarkup</title>, <title level="m">xTagger</title> and <title level="m">ImagText</title> form the core component for encoding image-based, document-centric XML, working together to link text and image. Through <title level="m">xMarkup</title>, the editor selects edition markup through a series of simple, configurable templates. <title level="m">xTagger</title> introduces markup into the text and provides filtered XML views, while <title level="m">ImagText</title> associates that text section with the corresponding image region, selected by the editor. In summary, the tagging works as follows: the editor selects text and image (in any order), describes the manuscript or textual feature, choosing tags and attribute values through <title level="m">xMarkup</title>, and inserts the markup. See Figure 1 for an illustration of the cooperation between <title level="m">xMarkup</title>, <title level="m">xTagger</title>, and <title level="m">ImagText</title>. The <title level="m">xTagger</title> ensures that the new markup is well-formed and potentially valid (Iacob, Dekhtyar, and Dekhtyar 2004).</item>
                  <item>
                     <title level="m">DucType</title> provides a specialized interface for describing individual manuscript letters. The editor configures <title level="m">DucType</title> through the Letter Template, which also creates and maintains a repository of letter images for a manuscript. The letter images are then used by the <title level="m">DucType</title> tool as a basis for comparison with any letter image in a manuscript image.</item>
                  <item>
                     <title level="m">Overlay</title> provides image manipulation support. An editor may find that multiple images of the same folio are required for a complete view of the manuscript. Using this tool the editor lays one image over another image of the same folio (using, for instance, ultraviolet and normal lighting conditions) and changes the transparency of the upper layer, enabling a useful comparison of the two images.</item>
                  <item>
                     <title level="m">SaMod</title> is a specialized tool for creating manuscript text collations with text from multiple sources (for example, the same text found in different manuscripts). This tool recognizes differences between transcripts and marks up these differences as variants of the text the editor identifies as the base text.</item>
                  <item>
                     <title level="m">StaTend</title>: Using a transcript marked with basic navigational markup – folio and folio line tags – this tool calculates manuscript statistical tendencies (number of folios, lines per folio, characters per line, etc.). Based on these statistical tendencies the tool reconstructs missing folios for which we can supply the text from another source. The <title level="m">StaTend</title> tool also includes functionality, called <term>RamSome</term>, for taking these textual <soCalled>virtual folios</soCalled> and translating the text into image, built character by character using letters taken from the manuscript.</item>
                  <item>
                     <title level="m">Quires</title> is a specialized interface for the edition and visualization of codicological markup. It allows the editor to build a virtual map of the physical object. We used this tool in the <title level="m">Electronic Boethius</title> project to reconstruct the gatherings of a manuscript whose binding was destroyed by fire. </item>
                  <item>The Search GUI is an interface for searching the edition. The editor can configure it to search any combination of XML markup, while hiding the intricacies of the query language (an extension of <title level="m">XPath</title> that supports multiple hierarchies).</item>
                  <item>Datalayer is the API for data access in <title level="m">EPT</title>. Tools request and deliver edition data (image and text files, DTDs, etc.) through the Datalayer API, which can interface with a variety of data storage devices, whether a database, file system, or remote server.</item>
                  <item>
                     <title level="m">Glossary</title> is a data-centric XML editor for creating a glossary including each word from the edition text. It automatically generates a complete word list from a transcript file encoded with basic formatting information (folio and folio line markup). The glossary links its entries to the text through the <hi rend="code">&lt;word&gt;</hi> tag – changes made within the edition text are automatically reflected in the glossary. It provides customizable templates for parts of speech and tools for saving the information in XML format (used later on for searching purposes) and HTML format (used for displaying glossed information).</item>
                  <item>The HTML browser provides HTML display and general browser support in <title level="m">EPT</title>. Having a browser integrated in the platform enables the <title level="m">EPT</title> to direct XSL transformations dynamically to the browser.</item>
                  <item>The Keyboard panel enables the editor to configure keyboards containing special characters (Old English <mentioned>æ</mentioned>, <mentioned>ð</mentioned>, and <mentioned>þ</mentioned>, Greek characters, etc.).</item>
               </list>
            </p>
            <p>In addition to editorial tools, the <title level="m">EPT</title> provides support for project management such as:
               <list type="unordered">
                  <item>Project properties editor is a GUI for various settings related to the project, such as fonts, encoding, title, etc. It provides support for adding and removing project images and for customizing markup tags, grouping tags in meaningful use categories, assigning aliases to tags and attributes, and adding and removing DTDs from a project.</item>
                  <item>XML filter allows the editor to create encoding filters for viewing different combinations of elements from the entire set. The output of a filter can be used for visualization, XSL transformation, or data interchange.</item>
                  <item>Extended XPath search is a search GUI using extended XPath language (an extension of XPath that applies to concurrent markup structures).</item>
               </list>
            </p>
            <p>
   From the <title level="m">Eclipse</title> platform, <title level="m">EPT</title> inherits three important features for project development: versioning control (CVS), automatic updates, and help content support. The editing team uses CVS to share project work-in-progress and as a project repository. Updates are useful for providing tool updates as well as bug fixes: an <title level="m">EPT</title> user need only check for updates and download them if available. Finally, the open help architecture enables the editor to create and use help files in such a way that the application help information is added independently of the application program.
   </p>
         </div0>
         <div0>
            <head>Demo overview</head>
            <p>
   Our demonstration will begin with examples of the most basic <title level="m">EPT</title> functionality, and depending on time we will demonstrate any tool or function. We will begin by creating a project and going through the usual operations for preparing an image-based electronic edition: content markup (using only text projections or filtered XML views), automatic linking of images and text, and text updates. We will demonstrate that our document-centric XML editor (<title level="m">xTagger</title>) can significantly simplify and speed up the encoding process. The editor can search for the information, visualize the encodings using customizable filters, or change project properties at any point in the editorial process. We will demonstrate the support for overlapping markup structures by adding/removing DTDs and markup encodings from external files. Depending on the interests of the audience, we can also show how a project can be customized, starting with user interfaces (toolbox, fonts, encodings, etc.) and ending with markup customization: associating aliases to tag elements and attributes, grouping tag elements by functionality, and displaying status bar information based on XPath queries. We will also be prepared to demonstrate <title level="m">Quires</title>, <title level="m">Overlay</title>, and <title level="m">DucType</title>, and show how to customize <title level="m">DucType</title>. Statistical information for the project encodings can be obtained dynamically and we can show how this information can be used in folio reconstruction (text and image) for missing manuscript parts. We can also demonstrate <title level="m">SaMod</title>, showing how it collates several different texts.
</p>
            <p>The demo may also include automatic generation of HTML content from edition data (glossaries, manuscript edition and manuscript transcription).
</p>
            <p>
We emphasize during the demonstration how <title level="m">Eclipse’s</title> open architecture makes it an excellent platform choice for implementing the <title level="m">EPT</title>.
</p>
         </div0>
      </body>
      <back>
         <div type="Bibliography">
            <head>Bibliography</head>
            <listBibl>
               <biblStruct>
                  <analytic>
                     <author>
                        <name reg="Kiernan, Kevin S.">Kevin S. Kiernan</name>
                     </author>
                     <title level="a">Digital Facsimiles in Editing: Some Guidelines for Editors of Image-based Scholarly Editions</title>
                  </analytic>
                  <monogr>
                     <title level="m">Electronic Textual Editing</title>
                     <imprint>
                        <date>Forthcoming</date>
                     </imprint>
                  </monogr>
                  <note>A volume of essays jointly sponsored by the Modern Language Association and the TEI Consortium, funded by the Mellon Foundation, and co-edited by John Unsworth, Katherine O’Brien O’Keeffe, and Lou Burnard, 2005.</note>
               </biblStruct>
               <biblStruct>
                  <analytic>
                     <author>
                        <name reg="Kiernan, Kevin S.">Kevin S. Kiernan</name>
                     </author>
                     <author>
                        <name reg="Porter, Dorothy C.">Dorothy C. Porter</name>
                     </author>
                     <title level="a">Edition Production Technology (EPT) and the Electronic Boethius Project</title>
                  </analytic>
                  <monogr>
                     <title level="j">DigiCULT</title>
                     <imprint>
                        <date>Forthcoming</date>
                     </imprint>
                  </monogr>
               </biblStruct>
               <biblStruct>
                  <analytic>
                     <author>
                        <name reg="Kiernan, Kevin S.">Kevin S. Kiernan</name>
                     </author>
                     <author>
                        <name reg="Dekhtyar, Alex">Alex Dekhtyar</name>
                     </author>
                     <author>
                        <name reg="Jaromczyk, Jurek">Jurek Jaromczyk</name>
                     </author>
                     <author>
                        <name reg="Porter, Dorothy C.">Dorothy C. Porter</name>
                     </author>
                     <author>
                        <name reg="Iacob, Ionut Emil">Ionut Emil Iacob</name>
                     </author>
                     <title level="a">Edition Production Technology (EPT) and the ARCHway Project</title>
                  </analytic>
                  <monogr>
                     <title level="j">DigiCULT.Info</title>
                     <imprint>
                        <biblScope type="pages">36-38</biblScope>
                        <date value="2004-08">August 2004</date>
                     </imprint>
                  </monogr>
               </biblStruct>
               <biblStruct>
                  <analytic>
                     <author>
                        <name reg="Kiernan, Kevin S.">Kevin S. Kiernan</name>
                     </author>
                     <author>
                        <name reg="Jaromczyk, Jurek">Jurek Jaromczyk</name>
                     </author>
                     <author>
                        <name reg="Dekhtyar, Alex">Alex Dekhtyar</name>
                     </author>
                     <author>
                        <name reg="Porter, Dorothy C.">Dorothy C. Porter</name>
                     </author>
                     <author>
                        <name reg="Hawley, Kenneth">Kenneth Hawley</name>
                     </author>
                     <author>
                        <name reg="Bodapati, Sandeep">Sandeep Bodapati</name>
                     </author>
                     <author>
                        <name reg="Iacob, Ionut Emil">Ionut Emil Iacob</name>
                     </author>
                     <title level="a">The ARCHway Project: Architecture for Research in Computing for Humanities through Research, Teaching, and Learning</title>
                  </analytic>
                  <monogr>
                     <title level="j">Literary and Linguistic Computing</title>
                     <imprint>
                        <date>Forthcoming</date>
                     </imprint>
                  </monogr>
                  <note>Special issue, papers from Joint International Conference of the Association for Computers and the Humanities and the Association for Literary and Linguistic Computing, 2003</note>
               </biblStruct>
               <biblStruct>
                  <analytic>
                     <author>
                        <name reg="Iacob, Ionut Emil">Ionut Emil Iacob</name>
                     </author>
                     <author>
                        <name reg="Dekhtyar, Alex">Alex Dekhtyar</name>
                     </author>
                     <author>
                        <name reg="Dekhtyar, Michael I.">Michael I. Dekhtyar</name>
                     </author>
                     <title level="a">Checking Potential Validity of XML Documents</title>
                  </analytic>
                  <monogr>
                     <title level="m">Proceedings, Seventh International Workshop on the Web and Databases, WebDB@SIGMOD/PODS</title>
                     <imprint>
                        <date value="2004">2004</date>
                        <biblScope type="pages">91-96</biblScope>
                     </imprint>
                  </monogr>
               </biblStruct>
            </listBibl>
         </div>
      </back>
   </text>
</TEI.2>