Matches in SemOpenAlex for { <https://semopenalex.org/work/W1988861783> ?p ?o ?g. }
- W1988861783 endingPage "326" @default.
- W1988861783 startingPage "307" @default.
- W1988861783 abstract "We present the architecture and data model for TEXTRACT, a robust, scalable and configurable document analysis framework. TEXTRACT has been engineered as a pipeline architecture, allowing for rapid prototyping and application development by freely mixing reusable, existing, language analysis plugins and custom, new, plugins with customizable functionality. We discuss design issues which arise from requirements of industrial strength efficiency and scalability, and which are further constrained by plugin interactions, both among themselves, and with a common data model comprising an annotation store, document vocabulary and a lexical cache. We exemplify some of these by focusing on a meta-plugin: an interpreter for annotation-based finite state transduction, through which many linguistic filters can be implemented as stand-alone plugins. The framework and component plugins have been extensively deployed in both research and industrial environments, for a broad range of text analysis and mining tasks." @default.
- W1988861783 created "2016-06-24" @default.
- W1988861783 creator A5055485322 @default.
- W1988861783 creator A5068769768 @default.
- W1988861783 creator A5048792646 @default.
- W1988861783 date "2004-09-01" @default.
- W1988861783 modified "2023-09-27" @default.
- W1988861783 title "The Talent system: TEXTRACT architecture and data model" @default.
- W1988861783 cites W1503310635 @default.
- W1988861783 cites W1539395461 @default.
- W1988861783 cites W1543884596 @default.
- W1988861783 cites W1662519165 @default.
- W1988861783 cites W178298440 @default.
- W1988861783 cites W1985565920 @default.
- W1988861783 cites W2007051236 @default.
- W1988861783 cites W2008112715 @default.
- W1988861783 cites W2033319677 @default.
- W1988861783 cites W2044070623 @default.
- W1988861783 cites W2046319108 @default.
- W1988861783 cites W2046599838 @default.
- W1988861783 cites W2058763402 @default.
- W1988861783 cites W2066066594 @default.
- W1988861783 cites W2068737686 @default.
- W1988861783 cites W2081508358 @default.
- W1988861783 cites W2096797897 @default.
- W1988861783 cites W2098167774 @default.
- W1988861783 cites W2098643647 @default.
- W1988861783 cites W2100703899 @default.
- W1988861783 cites W2103147879 @default.
- W1988861783 cites W2108455276 @default.
- W1988861783 cites W2119769170 @default.
- W1988861783 cites W2126637410 @default.
- W1988861783 cites W2133149548 @default.
- W1988861783 cites W2143562645 @default.
- W1988861783 cites W2149367074 @default.
- W1988861783 cites W2151157246 @default.
- W1988861783 cites W2160439261 @default.
- W1988861783 cites W2171064373 @default.
- W1988861783 cites W2426119782 @default.
- W1988861783 cites W2649172422 @default.
- W1988861783 cites W30314283 @default.
- W1988861783 cites W4508078 @default.
- W1988861783 doi "https://doi.org/10.1017/s1351324904003493" @default.
- W1988861783 hasPublicationYear "2004" @default.
- W1988861783 type Work @default.
- W1988861783 sameAs 1988861783 @default.
- W1988861783 citedByCount "22" @default.
- W1988861783 countsByYear W19888617832012 @default.
- W1988861783 countsByYear W19888617832013 @default.
- W1988861783 countsByYear W19888617832014 @default.
- W1988861783 crossrefType "journal-article" @default.
- W1988861783 hasAuthorship W1988861783A5048792646 @default.
- W1988861783 hasAuthorship W1988861783A5055485322 @default.
- W1988861783 hasAuthorship W1988861783A5068769768 @default.
- W1988861783 hasConcept C115903868 @default.
- W1988861783 hasConcept C118524514 @default.
- W1988861783 hasConcept C121332964 @default.
- W1988861783 hasConcept C123657996 @default.
- W1988861783 hasConcept C142362112 @default.
- W1988861783 hasConcept C153349607 @default.
- W1988861783 hasConcept C154945302 @default.
- W1988861783 hasConcept C168167062 @default.
- W1988861783 hasConcept C199360897 @default.
- W1988861783 hasConcept C2776321320 @default.
- W1988861783 hasConcept C41008148 @default.
- W1988861783 hasConcept C43521106 @default.
- W1988861783 hasConcept C48044578 @default.
- W1988861783 hasConcept C4924752 @default.
- W1988861783 hasConcept C77088390 @default.
- W1988861783 hasConcept C97355855 @default.
- W1988861783 hasConceptScore W1988861783C115903868 @default.
- W1988861783 hasConceptScore W1988861783C118524514 @default.
- W1988861783 hasConceptScore W1988861783C121332964 @default.
- W1988861783 hasConceptScore W1988861783C123657996 @default.
- W1988861783 hasConceptScore W1988861783C142362112 @default.
- W1988861783 hasConceptScore W1988861783C153349607 @default.
- W1988861783 hasConceptScore W1988861783C154945302 @default.
- W1988861783 hasConceptScore W1988861783C168167062 @default.
- W1988861783 hasConceptScore W1988861783C199360897 @default.
- W1988861783 hasConceptScore W1988861783C2776321320 @default.
- W1988861783 hasConceptScore W1988861783C41008148 @default.
- W1988861783 hasConceptScore W1988861783C43521106 @default.
- W1988861783 hasConceptScore W1988861783C48044578 @default.
- W1988861783 hasConceptScore W1988861783C4924752 @default.
- W1988861783 hasConceptScore W1988861783C77088390 @default.
- W1988861783 hasConceptScore W1988861783C97355855 @default.
- W1988861783 hasIssue "3-4" @default.
- W1988861783 hasLocation W19888617831 @default.
- W1988861783 hasOpenAccess W1988861783 @default.
- W1988861783 hasPrimaryLocation W19888617831 @default.
- W1988861783 hasRelatedWork W2152033542 @default.
- W1988861783 hasRelatedWork W2366465394 @default.
- W1988861783 hasRelatedWork W2382623646 @default.
- W1988861783 hasRelatedWork W2384305342 @default.
- W1988861783 hasRelatedWork W2392098988 @default.
- W1988861783 hasRelatedWork W2392817843 @default.
- W1988861783 hasRelatedWork W2909876463 @default.
- W1988861783 hasRelatedWork W3028015399 @default.