Matches in SemOpenAlex for { <https://semopenalex.org/work/W2005266950> ?p ?o ?g. }
- W2005266950 endingPage "846" @default.
- W2005266950 startingPage "827" @default.
- W2005266950 abstract "This paper proposes a fully automated information extraction methodology for weblogs. The methodology integrates a set of relevant approaches based on the use of web feeds and processing of HTML for the extraction of weblog properties. The approach includes a model for generating a wrapper that exploits web feeds for deriving a set of extraction rules automatically. Instead of performing a pairwise comparison between posts, the model matches the values of the web feeds against their corresponding HTML elements retrieved from multiple weblog posts. It adopts a probabilistic approach for deriving a set of rules and automating the process of wrapper generation. An evaluation of the model is conducted on a collection of weblogs reporting a prediction accuracy of 89 %. The results of this evaluation show that the proposed technique enables robust extraction of weblog properties and can be applied across the blogosphere." @default.
- W2005266950 created "2016-06-24" @default.
- W2005266950 creator A5012585972 @default.
- W2005266950 creator A5031364513 @default.
- W2005266950 creator A5034125179 @default.
- W2005266950 creator A5068475403 @default.
- W2005266950 date "2013-11-21" @default.
- W2005266950 modified "2023-09-26" @default.
- W2005266950 title "Entropy-based automated wrapper generation for weblog data extraction" @default.
- W2005266950 cites W11750719 @default.
- W2005266950 cites W1542149162 @default.
- W2005266950 cites W1616576116 @default.
- W2005266950 cites W1927338256 @default.
- W2005266950 cites W197497516 @default.
- W2005266950 cites W2005646337 @default.
- W2005266950 cites W2120101509 @default.
- W2005266950 cites W2135397824 @default.
- W2005266950 cites W2135479443 @default.
- W2005266950 cites W2143309843 @default.
- W2005266950 cites W2156279557 @default.
- W2005266950 cites W2157140910 @default.
- W2005266950 cites W2166994378 @default.
- W2005266950 cites W2548007011 @default.
- W2005266950 cites W3006373977 @default.
- W2005266950 cites W3146259567 @default.
- W2005266950 cites W4230980612 @default.
- W2005266950 doi "https://doi.org/10.1007/s11280-013-0269-6" @default.
- W2005266950 hasPublicationYear "2013" @default.
- W2005266950 type Work @default.
- W2005266950 sameAs 2005266950 @default.
- W2005266950 citedByCount "1" @default.
- W2005266950 countsByYear W20052669502015 @default.
- W2005266950 crossrefType "journal-article" @default.
- W2005266950 hasAuthorship W2005266950A5012585972 @default.
- W2005266950 hasAuthorship W2005266950A5031364513 @default.
- W2005266950 hasAuthorship W2005266950A5034125179 @default.
- W2005266950 hasAuthorship W2005266950A5068475403 @default.
- W2005266950 hasBestOaLocation W20052669502 @default.
- W2005266950 hasConcept C106301342 @default.
- W2005266950 hasConcept C110875604 @default.
- W2005266950 hasConcept C111919701 @default.
- W2005266950 hasConcept C121332964 @default.
- W2005266950 hasConcept C124101348 @default.
- W2005266950 hasConcept C136764020 @default.
- W2005266950 hasConcept C154945302 @default.
- W2005266950 hasConcept C165696696 @default.
- W2005266950 hasConcept C177264268 @default.
- W2005266950 hasConcept C184898388 @default.
- W2005266950 hasConcept C195807954 @default.
- W2005266950 hasConcept C199360897 @default.
- W2005266950 hasConcept C21959979 @default.
- W2005266950 hasConcept C23123220 @default.
- W2005266950 hasConcept C2779661781 @default.
- W2005266950 hasConcept C38652104 @default.
- W2005266950 hasConcept C41008148 @default.
- W2005266950 hasConcept C49937458 @default.
- W2005266950 hasConcept C62520636 @default.
- W2005266950 hasConcept C81639021 @default.
- W2005266950 hasConcept C98045186 @default.
- W2005266950 hasConceptScore W2005266950C106301342 @default.
- W2005266950 hasConceptScore W2005266950C110875604 @default.
- W2005266950 hasConceptScore W2005266950C111919701 @default.
- W2005266950 hasConceptScore W2005266950C121332964 @default.
- W2005266950 hasConceptScore W2005266950C124101348 @default.
- W2005266950 hasConceptScore W2005266950C136764020 @default.
- W2005266950 hasConceptScore W2005266950C154945302 @default.
- W2005266950 hasConceptScore W2005266950C165696696 @default.
- W2005266950 hasConceptScore W2005266950C177264268 @default.
- W2005266950 hasConceptScore W2005266950C184898388 @default.
- W2005266950 hasConceptScore W2005266950C195807954 @default.
- W2005266950 hasConceptScore W2005266950C199360897 @default.
- W2005266950 hasConceptScore W2005266950C21959979 @default.
- W2005266950 hasConceptScore W2005266950C23123220 @default.
- W2005266950 hasConceptScore W2005266950C2779661781 @default.
- W2005266950 hasConceptScore W2005266950C38652104 @default.
- W2005266950 hasConceptScore W2005266950C41008148 @default.
- W2005266950 hasConceptScore W2005266950C49937458 @default.
- W2005266950 hasConceptScore W2005266950C62520636 @default.
- W2005266950 hasConceptScore W2005266950C81639021 @default.
- W2005266950 hasConceptScore W2005266950C98045186 @default.
- W2005266950 hasIssue "4" @default.
- W2005266950 hasLocation W20052669501 @default.
- W2005266950 hasLocation W20052669502 @default.
- W2005266950 hasLocation W20052669503 @default.
- W2005266950 hasLocation W20052669504 @default.
- W2005266950 hasOpenAccess W2005266950 @default.
- W2005266950 hasPrimaryLocation W20052669501 @default.
- W2005266950 hasRelatedWork W1548492051 @default.
- W2005266950 hasRelatedWork W1788528807 @default.
- W2005266950 hasRelatedWork W1822441068 @default.
- W2005266950 hasRelatedWork W2151311386 @default.
- W2005266950 hasRelatedWork W2348792274 @default.
- W2005266950 hasRelatedWork W2350681646 @default.
- W2005266950 hasRelatedWork W2373481072 @default.
- W2005266950 hasRelatedWork W2389364963 @default.
- W2005266950 hasRelatedWork W2411679502 @default.
- W2005266950 hasRelatedWork W2800975405 @default.
- W2005266950 hasVolume "17" @default.