Matches in SemOpenAlex for { <https://semopenalex.org/work/W200042785> ?p ?o ?g. }
Showing items 1 to 88 of
88
with 100 items per page.
- W200042785 endingPage "583" @default.
- W200042785 startingPage "577" @default.
- W200042785 abstract "Recent work in machine learning for information extraction has focused on two distinct sub-problems: the conventional problem of filling template slots from natural language text, and the problem of wrapper induction, learning simple extraction procedures (“wrappers”) for highly structured text such as Web pages produced by CGI scripts. For suitably regular domains, existing wrapper induction algorithms can efficiently learn wrappers that are simple and highly accurate, but the regularity bias of these algorithms makes them unsuitable for most conventional information extraction tasks. Boosting is a technique for improving the performance of a simple machine learning algorithm by repeatedly applying it to the training set with different example weightings. We describe an algorithm that learns simple, low-coverage wrapper-like extraction patterns, which we then apply to conventional information extraction problems using boosting. The result is BWI, a trainable information extraction system with a strong precision bias and F1 performance better than state-of-the-art techniques in many domains." @default.
- W200042785 created "2016-06-24" @default.
- W200042785 creator A5051886728 @default.
- W200042785 creator A5080437721 @default.
- W200042785 date "2000-07-30" @default.
- W200042785 modified "2023-09-24" @default.
- W200042785 title "Boosted Wrapper Induction" @default.
- W200042785 cites W1547214099 @default.
- W200042785 cites W1553019137 @default.
- W200042785 cites W1553229631 @default.
- W200042785 cites W1554734378 @default.
- W200042785 cites W1602152045 @default.
- W200042785 cites W1616576116 @default.
- W200042785 cites W2032210760 @default.
- W200042785 cites W2046491822 @default.
- W200042785 cites W2065568440 @default.
- W200042785 cites W2135479443 @default.
- W200042785 cites W2147810216 @default.
- W200042785 cites W2162340487 @default.
- W200042785 cites W2163915185 @default.
- W200042785 cites W2163918411 @default.
- W200042785 hasPublicationYear "2000" @default.
- W200042785 type Work @default.
- W200042785 sameAs 200042785 @default.
- W200042785 citedByCount "133" @default.
- W200042785 countsByYear W2000427852012 @default.
- W200042785 countsByYear W2000427852013 @default.
- W200042785 countsByYear W2000427852014 @default.
- W200042785 countsByYear W2000427852015 @default.
- W200042785 countsByYear W2000427852016 @default.
- W200042785 countsByYear W2000427852017 @default.
- W200042785 countsByYear W2000427852019 @default.
- W200042785 crossrefType "proceedings-article" @default.
- W200042785 hasAuthorship W200042785A5051886728 @default.
- W200042785 hasAuthorship W200042785A5080437721 @default.
- W200042785 hasConcept C111472728 @default.
- W200042785 hasConcept C119857082 @default.
- W200042785 hasConcept C124101348 @default.
- W200042785 hasConcept C138885662 @default.
- W200042785 hasConcept C154945302 @default.
- W200042785 hasConcept C177264268 @default.
- W200042785 hasConcept C195807954 @default.
- W200042785 hasConcept C199360897 @default.
- W200042785 hasConcept C2780586882 @default.
- W200042785 hasConcept C41008148 @default.
- W200042785 hasConcept C46686674 @default.
- W200042785 hasConcept C61423126 @default.
- W200042785 hasConceptScore W200042785C111472728 @default.
- W200042785 hasConceptScore W200042785C119857082 @default.
- W200042785 hasConceptScore W200042785C124101348 @default.
- W200042785 hasConceptScore W200042785C138885662 @default.
- W200042785 hasConceptScore W200042785C154945302 @default.
- W200042785 hasConceptScore W200042785C177264268 @default.
- W200042785 hasConceptScore W200042785C195807954 @default.
- W200042785 hasConceptScore W200042785C199360897 @default.
- W200042785 hasConceptScore W200042785C2780586882 @default.
- W200042785 hasConceptScore W200042785C41008148 @default.
- W200042785 hasConceptScore W200042785C46686674 @default.
- W200042785 hasConceptScore W200042785C61423126 @default.
- W200042785 hasLocation W2000427851 @default.
- W200042785 hasOpenAccess W200042785 @default.
- W200042785 hasPrimaryLocation W2000427851 @default.
- W200042785 hasRelatedWork W138033052 @default.
- W200042785 hasRelatedWork W1499578805 @default.
- W200042785 hasRelatedWork W1553019137 @default.
- W200042785 hasRelatedWork W1553229631 @default.
- W200042785 hasRelatedWork W1602152045 @default.
- W200042785 hasRelatedWork W1616576116 @default.
- W200042785 hasRelatedWork W1999595522 @default.
- W200042785 hasRelatedWork W2015551056 @default.
- W200042785 hasRelatedWork W2065568440 @default.
- W200042785 hasRelatedWork W2066636486 @default.
- W200042785 hasRelatedWork W2093559286 @default.
- W200042785 hasRelatedWork W2104086170 @default.
- W200042785 hasRelatedWork W2115461474 @default.
- W200042785 hasRelatedWork W2135479443 @default.
- W200042785 hasRelatedWork W2143349571 @default.
- W200042785 hasRelatedWork W2145948275 @default.
- W200042785 hasRelatedWork W2153072229 @default.
- W200042785 hasRelatedWork W2160196229 @default.
- W200042785 hasRelatedWork W2162340487 @default.
- W200042785 hasRelatedWork W2163915185 @default.
- W200042785 isParatext "false" @default.
- W200042785 isRetracted "false" @default.
- W200042785 magId "200042785" @default.
- W200042785 workType "article" @default.