@inproceedings{scholars658, year = {2009}, journal = {2009 WRI World Congress on Computer Science and Information Engineering, CSIE 2009}, pages = {149--153}, volume = {5}, note = {cited By 0; Conference of 2009 WRI World Congress on Computer Science and Information Engineering, CSIE 2009 ; Conference Date: 31 March 2009 Through 2 April 2009; Conference Code:78368}, doi = {10.1109/CSIE.2009.661}, title = {Information extraction using Link Grammar}, address = {Los Angeles, CA}, author = {Zamin, N.}, isbn = {9780769535074}, keywords = {AS-links; Database construction; Database entry; Factual knowledge; Health safety; Information extraction; Link grammar; Literature search; Malaysia; Natural language processing; Operating units; Operation and maintenance; PETRONAS; Scientific texts; Terrorism attack, Computational linguistics; Computer science; Database systems; Information analysis; Mining, Natural language processing systems}, url = {https://www.scopus.com/inward/record.uri?eid=2-s2.0-71049144486&doi=10.1109\%2fCSIE.2009.661&partnerID=40&md5=7bceced2f606ba925dda0734a5249f03}, abstract = {In the last few years, Information Extraction (IE) has become a rapidly expanding field as the machine-readable documents keep growing exponentially. IE is the perfect solution to transform factual knowledge from publications into database entries. Many efforts have been made to automatically extract and mine scientific texts ranging from biochemical to terrorism attacks reports. This study is looking into the opportunity to extract important facts from the PETRONAS Health Safety and Environment (HSE) reports for database construction and analysis purpose. The reports are currently managed by PETRONAS Group HSE in Malaysia which contain the information on incidents and accidents occurred during the design, construction, operation and maintenance by all the PETRONAS Operating Units locally and worldwide. The effort to automate PETRONAS HSE reports will greatly benefit the PETRONAS Group HSE to automatically populate the database entries in which traditionally the task is arduous and time consuming. Many algorithms have been reported for IE ranging from simple statistical methods to advanced Natural language Processing (NLP) methods. This study investigates one of the NLP approach known as Link Grammar1 (LG) for extracting relevant information. LG appears within limited literature search to be the most suitable candidate algorithm. However, an exhaustive literature search will reveal the algorithm best suited to this application work. {\^A}{\copyright} 2008 IEEE.} }