#include <bt_rlp_managed.h>
Public Member Functions | |
virtual bool | GetConsistentType ()=0 |
virtual cli::array < NamedEntityData^ >^ | GetNamedEntityResultData (bool StripAffixes)=0 |
virtual String^ | GetProcessorReport ()=0 |
Get a report of the processors defined in this context. | |
virtual String^ | GetProperty (String^ property)=0 |
Get a context property value. | |
virtual Object^ | GetResultData (ResultType resultType, bool safeDataOnly)=0 |
Retrieve the data for a particular entity after processing input. | |
virtual void | ProcessBuffer (cli::array< System::Byte >^data, LanguageID language, String^ encoding, String^ mime_type)=0 |
Read and process data from a byte[], with optionally specified Language, Encoding, and MIME type/charset. | |
virtual void | ProcessBuffer (cli::array< System::Char >^data, LanguageID language)=0 |
Read and process data from a char[], with optionally specified Language. | |
virtual void | ProcessBuffer (String^ data, LanguageID language)=0 |
Read and process data from a String, with optionally specified Language. | |
virtual void | ProcessFile (String^ data_file_pathname, LanguageID language, String^ encoding, String^ mime_type)=0 |
Read and process data from a file, with optionally specified Language, Encoding, and MIME type/charset. | |
virtual void | SetConsistentType (bool flag)=0 |
virtual void | SetProperty (String^ property, String^ value)=0 |
Set a context property value. | |
virtual | ~Context () |
virtual BasisTechnology::RLP::Context::~Context | ( | ) | [virtual] |
virtual bool BasisTechnology::RLP::Context::GetConsistentType | ( | ) | [pure virtual] |
virtual cli::array<NamedEntityData^> ^ BasisTechnology::RLP::Context::GetNamedEntityResultData | ( | bool | StripAffixes | ) | [pure virtual] |
virtual String ^ BasisTechnology::RLP::Context::GetProcessorReport | ( | ) | [pure virtual] |
virtual String ^ BasisTechnology::RLP::Context::GetProperty | ( | String^ | property | ) | [pure virtual] |
property | the name of the property |
virtual Object ^ BasisTechnology::RLP::Context::GetResultData | ( | ResultType | resultType, | |
bool | safeDataOnly | |||
) | [pure virtual] |
resultType | the type of data to return. | |
safeDataOnly | if true, then some return types change to avoid unsafe pointers. |
For many of the result types, GetResultData returns an ordinary managed object.
For several result types, GetResultData returns an unsafe pointer to data we already have unless the safeDataOnly flag is set. This avoids the cost of copying the data. To return a managed copy of the original data, set safeDataOnly to true.
Entity Type | Return type | Safe return type | Comments |
---|---|---|---|
TOKEN | string[] | string[] | One string per token |
PART_OF_SPEECH | string[] | string[] | One string per token |
SENTENCE_BOUNDARY | IntegerVectorValue | SafeIntegerVectorValue | One integer per sentence; token index of the boundary token |
BASE_NOUN_PHRASE | IntegerVectorValue | SafeIntegerVectorValue | Two integers per phrase; token indices of the start and end |
DETECTED_LANGUAGE | uint (boxed) | uint (boxed) | Actually a LanguageID |
DETECTED_ENCODING | String | String | MIME charset or MIME type of the input data |
NAMED_ENTITY | IntegerVectorValue | SafeIntegerVectorValue | Three integers per phrase; token indices of the start and end plus the entity type |
TOKEN_OFFSET | IntegerVectorValue | SafeIntegerVectorValue | Two integers per token; character indices of the start and end. |
STEM | string[] | string[] | Stemmed form of each token. |
NORMALIZED_TOKEN | string[] | string[] | Normalized form of each token; not all languages/processors produce this result type. |
COMPOUND | Hashtable | Hashtable | The keys are uint token indices, and the values are string[] arrays of compound components. |
READING | Hashtable | Hashtable | The keys are uint token indices, and the values are string[] arrays of alternative readings. |
RAW_TEXT | SingletonStringValue | char[] | The input data, converted to UTF-16 |
STOPWORD | IntegerVectorValue | SafeIntegerVectorValue | One integer per stopword; the indices of the tokens identified as stopwords. |
virtual void BasisTechnology::RLP::Context::ProcessBuffer | ( | cli::array< System::Byte >^ | data, | |
LanguageID | language, | |||
String^ | encoding, | |||
String^ | mime_type | |||
) | [pure virtual] |
data | the input data to process. | |
language | the language, or LanguageID.UNKNOWN, of the input data. | |
encoding | the encoding of the input data. Null if unknown. | |
mime_type | the MIME character set or type of the input data. Null if unknown. |
virtual void BasisTechnology::RLP::Context::ProcessBuffer | ( | cli::array< System::Char >^ | data, | |
LanguageID | language | |||
) | [pure virtual] |
data | the input data to process. | |
language | the language, or LanguageID.UNKNOWN, of the input data. |
virtual void BasisTechnology::RLP::Context::ProcessBuffer | ( | String^ | data, | |
LanguageID | language | |||
) | [pure virtual] |
data | the input data to process. | |
language | the language, or LanguageID.UNKNOWN, of the input data. |
virtual void BasisTechnology::RLP::Context::ProcessFile | ( | String^ | data_file_pathname, | |
LanguageID | language, | |||
String^ | encoding, | |||
String^ | mime_type | |||
) | [pure virtual] |
data_file_pathname | the pathname of the file containing the input data to process. | |
language | the language, or LanguageID.UNKNOWN, of the input data. | |
encoding | the encoding of the input file. Null if unknown. | |
mime_type | the MIME character set or type of the input file. Null if unknown. |
virtual void BasisTechnology::RLP::Context::SetConsistentType | ( | bool | flag | ) | [pure virtual] |
virtual void BasisTechnology::RLP::Context::SetProperty | ( | String^ | property, | |
String^ | value | |||
) | [pure virtual] |
property | the name of the property | |
value | the value of the property |
Copyright © 2004-2008 Basis Technology Corporation. All Rights Reserved.