dc.creator | Sleiman, Hassan A. | es |
dc.creator | Corchuelo Gil, Rafael | es |
dc.date.accessioned | 2023-03-30T09:53:03Z | |
dc.date.available | 2023-03-30T09:53:03Z | |
dc.date.issued | 2012-07 | |
dc.identifier.citation | Sleiman, H.A. y Corchuelo Gil, R. (2012). Towards a Method for Unsupervised Web Information Extraction. En 12th International Conference: Web Engineering (ICWE 2012) (427-430), Berlín (Alemania): Springer. | |
dc.identifier.isbn | 978-3-642-31752-1 (impreso) | es |
dc.identifier.isbn | 978-3-642-31753-8 (online) | es |
dc.identifier.uri | https://hdl.handle.net/11441/143724 | |
dc.description.abstract | The literature provides a variety of techniques to build the information extractors on which some data integration systems rely. Information extraction techniques are usually based on extraction rules that require maintenance and adaptation if web sources change. We present our preliminary steps towards an unsupervised information extraction technique that searches web documents for shared patterns and fragments them until finding the relevant information that should be extracted. Experimental results on 1230 real-web documents demonstrate that our system performs fast and achieves promising results. | es |
dc.description.sponsorship | Ministerio de Ciencia y Tecnología TIN2007-64119 | es |
dc.description.sponsorship | Junta de Andalucía P07-TIC-2602 | es |
dc.description.sponsorship | Junta de Andalucía P08-TIC-4100 | es |
dc.description.sponsorship | Ministerio de Ciencia e Innovación TIN2008-04718-E | es |
dc.description.sponsorship | Ministerio de Ciencia e Innovación TIN2010-21744 | es |
dc.description.sponsorship | Ministerio de Economía, Industria y Competitividad TIN2010-09809-E | es |
dc.description.sponsorship | Ministerio de Ciencia e Innovación TIN2010-10811-E | es |
dc.description.sponsorship | Ministerio de Ciencia e Innovación TIN2010-09988-E | es |
dc.format | application/pdf | es |
dc.format.extent | 4 | es |
dc.language.iso | eng | es |
dc.publisher | Springer | es |
dc.relation.ispartof | 12th International Conference: Web Engineering (ICWE 2012) (2012), pp. 427-430. | |
dc.rights | Attribution-NonCommercial-NoDerivatives 4.0 Internacional | * |
dc.rights.uri | http://creativecommons.org/licenses/by-nc-nd/4.0/ | * |
dc.subject | Web Information Extraction | es |
dc.subject | Unsupervised Technique | es |
dc.title | Towards a Method for Unsupervised Web Information Extraction | es |
dc.type | info:eu-repo/semantics/conferenceObject | es |
dcterms.identifier | https://ror.org/03yxnpp24 | |
dc.type.version | info:eu-repo/semantics/publishedVersion | es |
dc.rights.accessRights | info:eu-repo/semantics/openAccess | es |
dc.contributor.affiliation | Universidad de Sevilla. Departamento de Lenguajes y Sistemas Informáticos | es |
dc.relation.projectID | TIN2007-64119 | es |
dc.relation.projectID | P07-TIC-2602 | es |
dc.relation.projectID | P08-TIC-4100 | es |
dc.relation.projectID | TIN2008-04718-E | es |
dc.relation.projectID | TIN2010-21744 | es |
dc.relation.projectID | TIN2010-09809-E | es |
dc.relation.projectID | TIN2010-10811-E | es |
dc.relation.projectID | TIN2010-09988-E | es |
dc.relation.publisherversion | https://link.springer.com/chapter/10.1007/978-3-642-31753-8_36 | es |
dc.identifier.doi | 10.1007/978-3-642-31753-8_36 | es |
dc.publication.initialPage | 427 | es |
dc.publication.endPage | 430 | es |
dc.eventtitle | 12th International Conference: Web Engineering (ICWE 2012) | es |
dc.eventinstitution | Berlín (Alemania) | es |
dc.relation.publicationplace | Berlin, Germany | es |
dc.contributor.funder | Ministerio de Ciencia y Tecnología (MCYT). España | es |
dc.contributor.funder | Junta de Andalucía | es |
dc.contributor.funder | Ministerio de Ciencia e Innovación (MICIN). España | es |
dc.contributor.funder | Ministerio de Economía, Industria y Competitividad | es |