{"refrec":{"BRefID":290118,"RR":"<b>Tharatipyakul, A.; Numnark, S.; Wichadakul, D.; Ingsriswang, S.</b> (2012). ChemEx: information extraction system for chemical data curation. <i>BMC Bioinformatics 13(Suppl 17)</i>: S9. <a href=\"https://dx.doi.org/10.1186/1471-2105-13-S17-S9\" target=\"_blank\">https://dx.doi.org/10.1186/1471-2105-13-S17-S9</a>","BEntID":282158,"PublicFlag":1,"CheckedFlag":1,"wosflag":1,"vabbflag":1,"RefStringPartII":". <i>BMC Bioinformatics 13(Suppl 17)</i>: S9. <a href=\"https://dx.doi.org/10.1186/1471-2105-13-S17-S9\" target=\"_blank\">https://dx.doi.org/10.1186/1471-2105-13-S17-S9</a>","DocTypID":8,"DocType":"Journal article","MarineFlag":0,"FreshFlag":0,"BrackishFlag":0,"TerrestrialFlag":0,"Authorstring":"Tharatipyakul, A.; Numnark, S.; Wichadakul, D.; Ingsriswang, S.","OrigTitleTranslFlag":0,"Authorstringtrunc":"Tharatipyakul, A. <i>et al.</i>","Englishabstract":"BackgroundManual chemical data curation from publications is error-prone, time consuming, and hard to maintain up-to-date data sets. Automatic information extraction can be used as a tool to reduce these problems. Since chemical structures usually described in images, information extraction needs to combine structure image recognition and text mining together.ResultsWe have developed ChemEx, a chemical information extraction system. ChemEx processes both text and images in publications. Text annotator is able to extract compound, organism, and assay entities from text content while structure image recognition enables translation of chemical raster images to machine readable format. A user can view annotated text along with summarized information of compounds, organism that produces those compounds, and assay tests.ConclusionsChemEx facilitates and speeds up chemical data curation by extracting compounds, organisms, and assays from a large collection of publications. The software and corpus can be downloaded from http://www.biotec.or.th/isl/ChemEx.","AbstractOtherLang":null,"BibLvlCode":"AS","StandardTitle":"ChemEx: information extraction system for chemical data curation","OrigTitleLangCode":"en","OrigTitleLangCodeExtended":"eng","OrigTitleLangID":15,"DateLastModified":{"date":"2024-12-10 01:33:17.368041","timezone_type":1,"timezone":"+01:00"},"UserAccessRight":null,"UserAccID":null,"AuthorKeywords":null,"OtherDescriptors":null,"Notes":null,"AnaPub":2012,"MonPub":null,"DateUpdate":"2018-02-13","DateCreate":"2017-10-19","SecASFANote":null,"ConfID":null,"PeerRev":1,"VlizCoreFlag":1,"WoScode":"WOS:000312985100009","VABBcode":null,"OpenAcc":1,"DOI":"10.1186/1471-2105-13-S17-S9"},"refs":null,"anarec":{"AnaID":290118,"PubliDate":2012,"Pagination":"S9","XtraPublOfAnaID":null,"ISBN":null,"Volume":"13","Issue":"Suppl 17","BRefMon":null,"BRefMonRR":null,"BRefXtra":null,"BRefXtraRR":null,"SerBRefID":253411,"SerRR":"BMC Bioinformatics. BioMed Central: London.  e-ISSN 1471-2105","StandardTitleSer":"BMC Bioinformatics","ISSN":null,"AbbrevSer":null,"StandardTitleMon":null,"StartPage":null,"Pages":null,"ToPubliDate":null,"BRefBibLvlCode":"S","SerNotes":null},"monrec":null,"serrec":null,"relations":null,"relationsRev":null,"addrec":null,"othpubs":null,"ownerships":null,"authors":[{"AutName":"Tharatipyakul","Firstname":"Atima","Initials":"A.","Affiliation":"Natl Ctr Genet Engn & Biotechnol BIOTEC, Informat Syst Lab, Klongluang, Pathumthani, Thailand.","Discriminator":null,"CorporateFlag":0,"BEntID":282158,"AutID":310412,"OrderNr":1,"DegrID":null,"EditorFlag":0,"CorrespFlag":0,"IllustratorFlag":0,"ReviserFlag":0,"TranslatorFlag":0,"InsAcronym":null,"InsFSN":null,"ORCID":null,"PersID":null,"InsID":null},{"AutName":"Numnark","Firstname":"Somrak","Initials":"S.","Affiliation":"Natl Ctr Genet Engn & Biotechnol BIOTEC, Informat Syst Lab, Klongluang, Pathumthani, Thailand.","Discriminator":null,"CorporateFlag":0,"BEntID":282158,"AutID":310413,"OrderNr":2,"DegrID":null,"EditorFlag":0,"CorrespFlag":0,"IllustratorFlag":0,"ReviserFlag":0,"TranslatorFlag":0,"InsAcronym":null,"InsFSN":null,"ORCID":null,"PersID":null,"InsID":null},{"AutName":"Wichadakul","Firstname":"Duangdao","Initials":"D.","Affiliation":"Natl Ctr Genet Engn & Biotechnol BIOTEC, Informat Syst Lab, Klongluang, Pathumthani, Thailand.","Discriminator":null,"CorporateFlag":0,"BEntID":282158,"AutID":310414,"OrderNr":3,"DegrID":null,"EditorFlag":0,"CorrespFlag":0,"IllustratorFlag":0,"ReviserFlag":0,"TranslatorFlag":0,"InsAcronym":null,"InsFSN":null,"ORCID":null,"PersID":null,"InsID":null},{"AutName":"Ingsriswang","Firstname":"Supawadee","Initials":"S.","Affiliation":"Natl Ctr Genet Engn & Biotechnol BIOTEC, Informat Syst Lab, Klongluang, Pathumthani, Thailand.","Discriminator":null,"CorporateFlag":0,"BEntID":282158,"AutID":310415,"OrderNr":4,"DegrID":null,"EditorFlag":0,"CorrespFlag":0,"IllustratorFlag":0,"ReviserFlag":0,"TranslatorFlag":0,"InsAcronym":null,"InsFSN":null,"ORCID":null,"PersID":null,"InsID":null}],"mapdetails":null,"datasets":null,"monographs":null,"monparts":null,"serparts":null,"BEntOpen":null,"BEntPrivate":null,"availability":[{"BInstID":308040,"LibID":36,"BRefID":290118,"EmbargoDate":null,"FullEmbargoDate":null,"PhysMedID":16,"hasOCRd":1,"ShelfLocCode":"308040","RFID":null,"PaidValue":null,"Medium":"Server","Description":"VLIZ Open Access","Acronym":"VLIZ","Library":"Vlaams Instituut voor de Zee","DutchTerm":"Open access","URL":null,"ClassifID":53,"Classification":"Open access","ReqLink":null,"ClassifTypID":1,"URLLocation":"https://www.vliz.be/imisdocs/publications/","SubDir":null,"InternalReq":0,"LoggedInReq":0,"Disclaimer":null,"DutchDisclaimer":null,"FileFormat":".pdf","FileDescr":"pdf","InsPub":1,"InsID":36,"FileFormID":6,"LendableFlag":1,"PublicFlag":1,"orderLib":"A","Notes":null,"AccConID":null,"AccessConstraint":null,"LicURL":null}],"litstyles":null,"thespers":null,"arch2discl":null,"SERpubls":[{"PublName":"BioMed Central","City":"London"}],"MONpubls":null,"pictures":[],"thestermsPath":null,"thestermsASFA":null,"taxtermsASFA":null,"geotermsASFA":null,"collections":null,"conf":null,"proj":null,"Physdatasets":null,"spcols":{"955":{"SpName":"Catalogue of Life acknowledged","SpColID":955,"ParSpColID":null,"TopParID":null,"ShortName":"Catalogue of Life ackn","URLLocation":null,"LibID":36,"OpenRepoFlag":null,"SpTypID":null,"TopParIDNotWebsite":null,"SpColPath":"Catalogue of Life ackn"}},"doi":null,"publs":null,"serparttypes":null,"monauthors":null,"MParts":null,"SParts":null,"hLibs":null,"langs":[{"BEntID":282158,"AbstractFlag":0,"LangID":15,"LangCode":"en","Lang":"English","DutchTerm":"Engels","LangCodeExtended":"eng"},{"BEntID":282158,"AbstractFlag":1,"LangID":15,"LangCode":"en","Lang":"English","DutchTerm":"Engels","LangCodeExtended":"eng"}],"urls":[{"URL":"https://dx.doi.org/10.1186/1471-2105-13-S17-S9","externalID":"10.1186/1471-2105-13-S17-S9","URLTypeCode":"DOI","URLID":60737,"URLTypID":13,"URLType":"DOI","URLPrefix":"http://dx.doi.org/"}],"thesterms":null,"taxterms":null,"geoterms":null,"othterms":null,"asfacodes":null,"asfa2codes":null,"thestermsFRIS":null,"taxtermsFRIS":null,"geotermsFRIS":null,"othtermsFRIS":null,"resmessage":"","complete":1,"sessions":{"newSesName":"Bouchti, Zohra, Z.","newSesDate":{"date":"2017-10-19 08:22:28.153000","timezone_type":3,"timezone":"Europe/Brussels"},"updSesName":"Lyssens, Liesbeth, L.","updSesDate":{"date":"2018-02-13 19:34:46.407000","timezone_type":3,"timezone":"Europe/Brussels"}}}
