{"refrec":{"BRefID":292308,"RR":"<b>Willis, A.; King, D.; Morse, D.; Dil, A.; Lyal, C.; Roberts, D.</b> (2010). From XML to XML: the why and how of making the biodiversity literature accessible to researchers, <b><i>in</i></b>: Calzolari, N. <i>et al.</i> <i>Proceedings of the International Conference on Language Resources and Evaluation, LREC 2010, 17-23 May 2010, Valletta, Malta.</i> pp. 1-8","BEntID":284360,"PublicFlag":1,"CheckedFlag":0,"wosflag":null,"vabbflag":null,"RefStringPartII":", <b><i>in</i></b>: Calzolari, N. <i>et al.</i> <i>Proceedings of the International Conference on Language Resources and Evaluation, LREC 2010, 17-23 May 2010, Valletta, Malta.</i> pp. 1-8","DocTypID":17,"DocType":"Book chapters","MarineFlag":0,"FreshFlag":0,"BrackishFlag":0,"TerrestrialFlag":0,"Authorstring":"Willis, A.; King, D.; Morse, D.; Dil, A.; Lyal, C.; Roberts, D.","OrigTitleTranslFlag":0,"Authorstringtrunc":"Willis, A. <i>et al.</i>","Englishabstract":"We present the ABLE document collection, which consists of a set of annotated volumes of the Bulletin of the British Museum (Natural History). These were developed during our ongoing work on automating the markup of scanned copies of the biodiversity literature. Such automation is required if historic literature is to be used to inform contemporary issues in biodiversity research. We consider an enhanced TEI XML markup language, which is used as an intermediate stage in translating from the initial XML obtained from Optical Character Recognition to taXMLit, the target annotation schema. The intermediate representation allows additional information from external sources such as a taxonomic thesaurus to be incorporated before the final translation into taXMLit. We give an overview of the project workflow in automating the markup process, and consider what extensions to existing markup schema will be required to best support working taxonomists. Finally, we discuss some of the particular issues which were encountered in converting between different XML formats.","AbstractOtherLang":null,"BibLvlCode":"AM","StandardTitle":"From XML to XML: the why and how of making the biodiversity literature accessible to researchers","OrigTitleLangCode":"en","OrigTitleLangCodeExtended":"eng","OrigTitleLangID":15,"DateLastModified":{"date":"2024-12-10 01:33:17.368041","timezone_type":1,"timezone":"+01:00"},"UserAccessRight":null,"UserAccID":null,"AuthorKeywords":null,"OtherDescriptors":null,"Notes":null,"AnaPub":2010,"MonPub":null,"DateUpdate":"2018-01-31","DateCreate":"2018-01-31","SecASFANote":null,"ConfID":null,"PeerRev":0,"VlizCoreFlag":1,"WoScode":null,"VABBcode":null,"OpenAcc":0},"refs":null,"anarec":{"AnaID":292308,"PubliDate":2010,"Pagination":"1-8","XtraPublOfAnaID":null,"ISBN":"2-9517408-6-7","Volume":null,"Issue":null,"BRefMon":292307,"BRefMonRR":"<b>Calzolari, N. <i>et al.</i></b> (2010). Proceedings of the International Conference on Language Resources and Evaluation, LREC 2010, 17-23 May 2010, Valletta, Malta. European Language Resources Association: France. ISBN 2-9517408-6-7. ","BRefXtra":null,"BRefXtraRR":null,"SerBRefID":null,"SerRR":null,"StandardTitleSer":null,"ISSN":null,"AbbrevSer":null,"StandardTitleMon":"Proceedings of the International Conference on Language Resources and Evaluation, LREC 2010, 17-23 May 2010, Valletta, Malta","StartPage":1,"Pages":8,"ToPubliDate":null,"BRefBibLvlCode":"M","SerNotes":null,"AutString":"Calzolari, N. <i>et al.</i>"},"monrec":null,"serrec":null,"relations":null,"relationsRev":null,"addrec":null,"othpubs":null,"ownerships":null,"authors":[{"AutName":"Willis","Firstname":"Alistair","Initials":"A.","Affiliation":null,"Discriminator":null,"CorporateFlag":0,"BEntID":284360,"AutID":291021,"OrderNr":1,"DegrID":null,"EditorFlag":0,"CorrespFlag":0,"IllustratorFlag":0,"ReviserFlag":0,"TranslatorFlag":0,"InsAcronym":null,"InsFSN":null,"ORCID":null,"PersID":null,"InsID":null},{"AutName":"King","Firstname":"David","Initials":"D.","Affiliation":null,"Discriminator":null,"CorporateFlag":0,"BEntID":284360,"AutID":290961,"OrderNr":2,"DegrID":null,"EditorFlag":0,"CorrespFlag":0,"IllustratorFlag":0,"ReviserFlag":0,"TranslatorFlag":0,"InsAcronym":null,"InsFSN":null,"ORCID":null,"PersID":null,"InsID":null},{"AutName":"Morse","Firstname":"David","Initials":"D.","Affiliation":null,"Discriminator":null,"CorporateFlag":0,"BEntID":284360,"AutID":58082,"OrderNr":3,"DegrID":null,"EditorFlag":0,"CorrespFlag":0,"IllustratorFlag":0,"ReviserFlag":0,"TranslatorFlag":0,"InsAcronym":null,"InsFSN":null,"ORCID":null,"PersID":null,"InsID":null},{"AutName":"Dil","Firstname":"Anton","Initials":"A.","Affiliation":null,"Discriminator":null,"CorporateFlag":0,"BEntID":284360,"AutID":291022,"OrderNr":4,"DegrID":null,"EditorFlag":0,"CorrespFlag":0,"IllustratorFlag":0,"ReviserFlag":0,"TranslatorFlag":0,"InsAcronym":null,"InsFSN":null,"ORCID":null,"PersID":null,"InsID":null},{"AutName":"Lyal","Firstname":"Chris","Initials":"C.","Affiliation":null,"Discriminator":null,"CorporateFlag":0,"BEntID":284360,"AutID":210438,"OrderNr":5,"DegrID":null,"EditorFlag":0,"CorrespFlag":0,"IllustratorFlag":0,"ReviserFlag":0,"TranslatorFlag":0,"InsAcronym":null,"InsFSN":null,"ORCID":null,"PersID":null,"InsID":null},{"AutName":"Roberts","Firstname":"Dave","Initials":"D.","Affiliation":null,"Discriminator":null,"CorporateFlag":0,"BEntID":284360,"AutID":264773,"OrderNr":6,"DegrID":null,"EditorFlag":0,"CorrespFlag":0,"IllustratorFlag":0,"ReviserFlag":0,"TranslatorFlag":0,"InsAcronym":null,"InsFSN":null,"ORCID":null,"PersID":null,"InsID":null}],"mapdetails":null,"datasets":null,"monographs":null,"monparts":null,"serparts":null,"BEntOpen":null,"BEntPrivate":null,"availability":[{"BInstID":310492,"LibID":36,"BRefID":292308,"EmbargoDate":null,"FullEmbargoDate":null,"PhysMedID":16,"hasOCRd":null,"ShelfLocCode":"310492","RFID":null,"PaidValue":null,"Medium":"Server","Description":"Interne VLIZ documenten","Acronym":"VLIZ","Library":"Vlaams Instituut voor de Zee","DutchTerm":"Non-open access","URL":null,"ClassifID":228,"Classification":"Non-open access","ReqLink":1,"ClassifTypID":3,"URLLocation":"https://www.vliz.be/imisdocs/publications/","SubDir":1,"InternalReq":1,"LoggedInReq":1,"Disclaimer":"Disclaimer_VLIZ_Intern","DutchDisclaimer":"<p>Deze publicatie is enkel beschikbaar voor persoonlijk gebruik binnen de Innovocean site <br />en mag op geen enkele manier verder worden verspreid.</p>","FileFormat":".pdf","FileDescr":"pdf","InsPub":1,"InsID":36,"FileFormID":6,"LendableFlag":1,"PublicFlag":1,"orderLib":"A","Notes":null,"AccConID":null,"AccessConstraint":null,"LicURL":null}],"litstyles":[{"LitStyID":3,"Style":"Conference paper"}],"thespers":null,"arch2discl":null,"SERpubls":null,"MONpubls":[{"PublName":"European Language Resources Association","Place":"France"}],"pictures":[],"thestermsPath":null,"thestermsASFA":null,"taxtermsASFA":null,"geotermsASFA":null,"collections":null,"conf":null,"proj":null,"Physdatasets":null,"spcols":{"955":{"SpName":"Catalogue of Life acknowledged","SpColID":955,"ParSpColID":null,"TopParID":null,"ShortName":"Catalogue of Life ackn","URLLocation":null,"LibID":36,"OpenRepoFlag":null,"SpTypID":null,"TopParIDNotWebsite":null,"SpColPath":"Catalogue of Life ackn"}},"doi":null,"publs":null,"serparttypes":null,"monauthors":[{"AutName":"Calzolari","Initials":"N.","CorporateFlag":0,"BEntID":284359,"AutID":291013,"OrderNr":1,"DegrID":null,"EditorFlag":0,"CorrespFlag":0,"IllustratorFlag":0,"ReviserFlag":0,"TranslatorFlag":0,"AutStrTrunc":"Calzolari, N. <i>et al.</i>"},{"AutName":"Choukri","Initials":"K.","CorporateFlag":0,"BEntID":284359,"AutID":291014,"OrderNr":2,"DegrID":null,"EditorFlag":0,"CorrespFlag":0,"IllustratorFlag":0,"ReviserFlag":0,"TranslatorFlag":0,"AutStrTrunc":"Calzolari, N. <i>et al.</i>"},{"AutName":"Maegaard","Initials":"B.","CorporateFlag":0,"BEntID":284359,"AutID":291015,"OrderNr":3,"DegrID":null,"EditorFlag":0,"CorrespFlag":0,"IllustratorFlag":0,"ReviserFlag":0,"TranslatorFlag":0,"AutStrTrunc":"Calzolari, N. <i>et al.</i>"},{"AutName":"Mariani","Initials":"J.","CorporateFlag":0,"BEntID":284359,"AutID":291016,"OrderNr":4,"DegrID":null,"EditorFlag":0,"CorrespFlag":0,"IllustratorFlag":0,"ReviserFlag":0,"TranslatorFlag":0,"AutStrTrunc":"Calzolari, N. <i>et al.</i>"},{"AutName":"Odijk","Initials":"J.","CorporateFlag":0,"BEntID":284359,"AutID":291017,"OrderNr":5,"DegrID":null,"EditorFlag":0,"CorrespFlag":0,"IllustratorFlag":0,"ReviserFlag":0,"TranslatorFlag":0,"AutStrTrunc":"Calzolari, N. <i>et al.</i>"},{"AutName":"Piperidis","Initials":"S.","CorporateFlag":0,"BEntID":284359,"AutID":291018,"OrderNr":6,"DegrID":null,"EditorFlag":0,"CorrespFlag":0,"IllustratorFlag":0,"ReviserFlag":0,"TranslatorFlag":0,"AutStrTrunc":"Calzolari, N. <i>et al.</i>"},{"AutName":"Rosner","Initials":"M.","CorporateFlag":0,"BEntID":284359,"AutID":291019,"OrderNr":7,"DegrID":null,"EditorFlag":0,"CorrespFlag":0,"IllustratorFlag":0,"ReviserFlag":0,"TranslatorFlag":0,"AutStrTrunc":"Calzolari, N. <i>et al.</i>"},{"AutName":"Tapias","Initials":"D.","CorporateFlag":0,"BEntID":284359,"AutID":291020,"OrderNr":8,"DegrID":null,"EditorFlag":0,"CorrespFlag":0,"IllustratorFlag":0,"ReviserFlag":0,"TranslatorFlag":0,"AutStrTrunc":"Calzolari, N. <i>et al.</i>"}],"MParts":null,"SParts":null,"hLibs":null,"langs":[{"BEntID":284360,"AbstractFlag":0,"LangID":15,"LangCode":"en","Lang":"English","DutchTerm":"Engels","LangCodeExtended":"eng"},{"BEntID":284360,"AbstractFlag":1,"LangID":15,"LangCode":"en","Lang":"English","DutchTerm":"Engels","LangCodeExtended":"eng"}],"urls":null,"thesterms":null,"taxterms":null,"geoterms":null,"othterms":null,"asfacodes":null,"asfa2codes":null,"thestermsFRIS":null,"taxtermsFRIS":null,"geotermsFRIS":null,"othtermsFRIS":null,"resmessage":"","complete":1,"sessions":{"newSesName":"Bouchti, Zohra, Z.","newSesDate":{"date":"2018-01-31 08:46:03.743000","timezone_type":3,"timezone":"Europe/Brussels"},"updSesName":"Bouchti, Zohra, Z.","updSesDate":{"date":"2018-01-31 08:46:03.743000","timezone_type":3,"timezone":"Europe/Brussels"}}}
