Web Service Method: Annotate and Store from File
Web Service Method: Annotate and Store from File
Description |
|---|
[file] Annotates the file with extracted concepts in RDF/XML format and stores it in the remote repository. |
URL: /extractor/api/annotate
Supported Methods |
|---|
POST |
Content-Type: multipart/form-data
Parameter | Type | Required | Description |
|---|---|---|---|
categorizationWithPpxBoost | Boolean | false | Use Extractor boosting, default = false |
categorize | Boolean | false | Categorization extraction, default = false |
conceptMinimumScore | Double | false | Minimum required score of concepts, default = 0 |
conceptSchemeFilters | Array of String | false | Concept scheme URI filters |
corpusScoring | Array of String | false | Corpus term scoring. Enabled if corpusIds (UUID) are provided. |
customAttributeFilters | Array of CustomProperty | false | Custom attribute (property uri and string value) filters |
customClassFilters | Array of String | false | Custom class URI filters |
disambiguate | Boolean | false | Use thesaurus based disambiguation, default = false |
displayText | Boolean | false | Include text extracted from file in response, default = false |
documentClassifierIds | Array of String | false | Enable document classification by giving the document classifier IDs as input. |
documentId | String | false | Internal ID of the document, taken from documentUri. |
documentUri | String | true | URI of annotated document, used as ID |
extractorVersion | String | false | Version of PPX Extractor used |
file | MultipartFile | true | File to be annotated (Word, Excel, PowerPoint, PDF, open document) - Mime type of request must be 'multipart/form-data' |
filterNestedConcepts | Boolean | false | Remove concept matches that are contained within other matches, default = true |
findPersonNames | Boolean | false | Deprecated (use nerParameters) - extracts person names from the given text |
language | String | false | Extraction language (en, de, es, fr, ...) |
lemmatization | Boolean | false | Use lemmatization, default = true |
locationExtraction | Boolean | false | Deprecated (use nerParameters) - extracts locations from the given text |
nerParameters | Array of NERConfig | false | Array of models that are used for Named Entity Recognition |
numberOfConcepts | Integer | false | Retrieve number of concepts, default = 25 |
numberOfTerms | Integer | false | Retrieve number of terms, default = 25 |
phraseLength | Integer | false | Phrase length, default = 4 |
projectId | Array of String | false | Thesaurus projectIds |
properties | Array of String | false | Array of custom class attributes and relations that will be fetched by providing their property URIs as input. Furthermore it supports http://www.w3.org/1999/02/22-rdf-syntax-ns#type. Set to all to fetch all properties. |
regexFilename | String | false | File name for regex patterns |
resultFilterSparql | String | false | Specify an optional SPARQL query for filtering the RDF result |
sentimentAnalysis | Boolean | false | Sentiment analysis, default = false |
shadowConceptCorpusId | Array of String | false | Shadow concepts calculation. Enabled if corpusIds (UUID) are provided. |
showMatchingDetails | Boolean | false | Shows which concept labels were found inside the text, default = false |
showMatchingPosition | Boolean | false | Shows the position of the matched text; only shown if showMatchingDetails = true, default = false |
tfidfScoring | Boolean | false | Use TFIDF scoring, default = false |
title | String | false | Title of the document |
useRelatedConcepts | Boolean | false | Retrieve related concepts, default = false |
useTransitiveBroaderConcepts | Boolean | false | Retrieve transitive broader concepts, default = false |
useTransitiveBroaderTopConcepts | Boolean | false | Retrieve transitive broader top concepts, default = false |
useTypes | Boolean | false | Retrieve custom types for concepts, default = false |
Attribute | Type | Required | Comment |
|---|---|---|---|
property | String | false | Property |
value | String | false | Value |
{
"property" : "https://semantic-web.com/api/property#26100",
"value" : "some value"
}
Attribute | Type | Required | Comment |
|---|---|---|---|
method | Method | false | Method used for Named Entity Extraction: RULE_BASED or MAXIMUM_ENTROPY (default: MAXIMUM_ENTROPY) |
type | String | false | Type of Named Entity Model. Pre-defined models for MAXIMUM_ENTROPY: person, organization, location |
{
"method" : "MAXIMUM_ENTROPY",
"type" : "https://semantic-web.com/api/type#3179"
}
An ObjectStreamField object.
Attribute | Type | Required | Comment |
|---|---|---|---|
field | Field | false | |
name | String | false | |
offset | int | false | |
signature | String | false | |
type | Class | false | |
unshared | Boolean | false | |
Click here to expand...
{
"field" : {
"genericInfo" : {
"factory" : null,
"tree" : null,
"genericType" : null
},
"declaredAnnotations" : { },
"overrideFieldAccessor" : { },
"signature" : "some signature",
"annotations" : [ 48 ],
"securityCheckCache" : { },
"slot" : 26477,
"fieldAccessor" : { },
"modifiers" : 24139,
"type" : {
"annotationData" : null,
"genericInfo" : null,
"ENUM" : 32463,
"enumConstantDirectory" : { },
"classRedefinedCount" : 22746,
"initted" : false,
"cachedConstructor" : null,
"useCaches" : true,
"SYNTHETIC" : 27448,
"annotationType" : null,
"newInstanceCallerCache" : null,
"reflectionData" : null,
"classValueMap" : { },
"serialPersistentFields" : [ null ],
"serialVersionUID" : 10320,
"ANNOTATION" : 14968,
"enumConstants" : [ null, null ],
"name" : "some name",
"reflectionFactory" : null,
"allPermDomain" : null
},
"ACCESS_PERMISSION" : {
"serialVersionUID" : 26505,
"name" : "some name"
},
"root" : {
"genericInfo" : null,
"declaredAnnotations" : { },
"overrideFieldAccessor" : null,
"signature" : "some signature",
"annotations" : [ 119, 46, 76 ],
"securityCheckCache" : null,
"slot" : 5243,
"fieldAccessor" : null,
"modifiers" : 32720,
"type" : null,
"ACCESS_PERMISSION" : null,
"root" : null,
"name" : "some name",
"override" : false,
"reflectionFactory" : null,
"clazz" : null
},
"name" : "some name",
"override" : true,
"reflectionFactory" : {
"inflationThreshold" : 19524,
"initted" : true,
"soleInstance" : null,
"reflectionFactoryAccessPerm" : null,
"langReflectAccess" : null,
"noInflation" : false
},
"clazz" : {
"annotationData" : null,
"genericInfo" : null,
"ENUM" : 14462,
"enumConstantDirectory" : { },
"classRedefinedCount" : 26901,
"initted" : true,
"cachedConstructor" : null,
"useCaches" : true,
"SYNTHETIC" : 15733,
"annotationType" : null,
"newInstanceCallerCache" : null,
"reflectionData" : null,
"classValueMap" : { },
"serialPersistentFields" : [ null, null ],
"serialVersionUID" : 1996,
"ANNOTATION" : 14537,
"enumConstants" : [ null, null ],
"name" : "some name",
"reflectionFactory" : null,
"allPermDomain" : null
}
},
"offset" : 8626,
"signature" : "some signature",
"unshared" : false,
"name" : "some name",
"type" : {
"annotationData" : {
"declaredAnnotations" : { },
"redefinedCount" : 4678,
"annotations" : { }
},
"genericInfo" : {
"factory" : null,
"superclass" : null,
"tree" : null,
"typeParams" : [ null, null, null ],
"NONE" : null,
"superInterfaces" : [ null, null, null ]
},
"ENUM" : 4825,
"enumConstantDirectory" : { },
"classRedefinedCount" : 19620,
"initted" : true,
"cachedConstructor" : {
"genericInfo" : null,
"declaredAnnotations" : { },
"hasRealParameterData" : false,
"parameterTypes" : [ null, null ],
"signature" : "some signature",
"annotations" : [ 0, 59 ],
"securityCheckCache" : null,
"constructorAccessor" : null,
"slot" : 29100,
"modifiers" : 9877,
"ACCESS_PERMISSION" : null,
"exceptionTypes" : [ null ],
"root" : null,
"override" : false,
"parameterAnnotations" : [ 74, 86 ],
"reflectionFactory" : null,
"clazz" : null,
"parameters" : [ null, null ]
},
"useCaches" : false,
"SYNTHETIC" : 24161,
"annotationType" : {
"inherited" : false,
"members" : { },
"memberDefaults" : { },
"$assertionsDisabled" : false,
"memberTypes" : { },
"retention" : "RUNTIME"
},
"newInstanceCallerCache" : {
"annotationData" : null,
"genericInfo" : null,
"ENUM" : 1033,
"enumConstantDirectory" : { },
"classRedefinedCount" : 10123,
"initted" : false,
"cachedConstructor" : null,
"useCaches" : false,
"SYNTHETIC" : 6635,
"annotationType" : null,
"newInstanceCallerCache" : null,
"reflectionData" : null,
"classValueMap" : { },
"serialPersistentFields" : [ null, null, null ],
"serialVersionUID" : 6521,
"ANNOTATION" : 26847,
"enumConstants" : [ null, null, null ],
"name" : "some name",
"reflectionFactory" : null,
"allPermDomain" : null
},
"reflectionData" : {
"next" : null,
"discovered" : null,
"referent" : null,
"pending" : null,
"lock" : null,
"clock" : 24478,
"queue" : null,
"timestamp" : 16613
},
"classValueMap" : { },
"serialPersistentFields" : [ {
"field" : null,
"offset" : 22640,
"signature" : "some signature",
"unshared" : true,
"name" : "some name",
"type" : null
}, {
"field" : null,
"offset" : 23255,
"signature" : "some signature",
"unshared" : false,
"name" : "some name",
"type" : null
} ],
"serialVersionUID" : 20269,
"ANNOTATION" : 24004,
"enumConstants" : [ { }, { } ],
"name" : "some name",
"reflectionFactory" : {
"inflationThreshold" : 17765,
"initted" : true,
"soleInstance" : null,
"reflectionFactoryAccessPerm" : null,
"langReflectAccess" : null,
"noInflation" : true
},
"allPermDomain" : {
"staticPermissions" : false,
"debug" : null,
"hasAllPerm" : false,
"codesource" : null,
"permissions" : null,
"classloader" : null,
"principals" : [ null, null ],
"key" : null
}
}
}
text/plain
Status: 200 - OK