/*******************************************************************************
* Copyright 2012-2019 Amazon.com, Inc. or its affiliates. All Rights Reserved.
* Licensed under the Apache License, Version 2.0 (the "License"). You may not use
* this file except in compliance with the License. A copy of the License is located at
*
* http://aws.amazon.com/apache2.0
*
* or in the "license" file accompanying this file.
* This file is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR
* CONDITIONS OF ANY KIND, either express or implied. See the License for the
* specific language governing permissions and limitations under the License.
* *****************************************************************************
*
* AWS Tools for Windows (TM) PowerShell (TM)
*
*/
using System;
using System.Collections.Generic;
using System.Linq;
using System.Management.Automation;
using System.Text;
using Amazon.PowerShell.Common;
using Amazon.Runtime;
using Amazon.Textract;
using Amazon.Textract.Model;
namespace Amazon.PowerShell.Cmdlets.TXT
{
/// <summary>
/// Gets the results for an Amazon Textract asynchronous operation that analyzes text
/// in a document.
///
/// <para>
/// You start asynchronous text analysis by calling <c>StartDocumentAnalysis</c>, which
/// returns a job identifier (<c>JobId</c>). When the text analysis operation finishes,
/// Amazon Textract publishes a completion status to the Amazon Simple Notification Service
/// (Amazon SNS) topic that's registered in the initial call to <c>StartDocumentAnalysis</c>.
/// To get the results of the text-detection operation, first check that the status value
/// published to the Amazon SNS topic is <c>SUCCEEDED</c>. If so, call <c>GetDocumentAnalysis</c>,
/// and pass the job identifier (<c>JobId</c>) from the initial call to <c>StartDocumentAnalysis</c>.
/// </para>
/// <para>
/// <c>GetDocumentAnalysis</c> returns an array of <c>Block</c> objects. The following
/// types of information are returned:
/// </para>
/// <list type="bullet">
/// <item><description>
/// Form data (key-value pairs). The related information is returned in two <c>Block</c>
/// objects, each of type <c>KEY_VALUE_SET</c>: a KEY <c>Block</c> object
/// and a VALUE <c>Block</c> object. For example, <i>Name: Ana Silva Carolina</i>
/// contains a key and value. <i>Name:</i> is the key. <i>Ana Silva Carolina</i> is the
/// value.
/// </description></item>
/// <item><description>
/// Table and table cell data. A TABLE <c>Block</c> object contains information
/// about a detected table. A CELL <c>Block</c> object is returned for each cell
/// in a table.
/// </description></item>
/// <item><description>
/// Lines and words of text. A LINE <c>Block</c> object contains one or more WORD
/// <c>Block</c> objects. All lines and words that are detected in the document
/// are returned (including text that doesn't have a relationship with the value of the
/// <c>StartDocumentAnalysis</c> <c>FeatureTypes</c> input parameter).
/// </description></item>
/// <item><description>
/// Query. A QUERY Block object contains the query text, alias and link to the associated
/// Query results block object.
/// </description></item>
/// <item><description>
/// Query Results. A QUERY_RESULT Block object contains the answer to the query and an
/// ID that connects it to the query asked. This Block also contains a confidence score.
/// </description></item>
/// </list>
/// <para>
/// While processing a document with queries, look out for <c>INVALID_REQUEST_PARAMETERS</c>
/// output. This indicates that either the per page query limit has been exceeded or that
/// the operation is trying to query a page in the document which doesn’t exist.
/// </para>
/// <para>
/// Selection elements such as check boxes and option buttons (radio buttons) can be detected
/// in form data and in tables. A SELECTION_ELEMENT <c>Block</c> object contains
/// information about a selection element, including the selection status.
/// </para>
/// <para>
/// Use the <c>MaxResults</c> parameter to limit the number of blocks that are returned.
/// If there are more results than specified in <c>MaxResults</c>, the value of
/// <c>NextToken</c> in the operation response contains a pagination token for getting
/// the next set of results. To get the next page of results, call <c>GetDocumentAnalysis</c>,
/// and populate the <c>NextToken</c> request parameter with the token value that's
/// returned from the previous call to <c>GetDocumentAnalysis</c>.
/// </para>
/// <para>
/// For more information, see Document
/// Text Analysis.
/// </para>
/// <para>
/// In the AWS.Tools.Textract module, this cmdlet automatically pages all available results to the pipeline - parameters related to iteration are only needed if you want to manually control the paginated output. To disable autopagination, use -NoAutoIteration.
/// </para>
/// </summary>
[Cmdlet("Get", "TXTDocumentAnalysis")]
[OutputType("Amazon.Textract.Model.GetDocumentAnalysisResponse")]
[AWSCmdlet("Calls the Amazon Textract GetDocumentAnalysis API operation.", Operation = new[] {"GetDocumentAnalysis"}, SelectReturnType = typeof(Amazon.Textract.Model.GetDocumentAnalysisResponse))]
[AWSCmdletOutput("Amazon.Textract.Model.GetDocumentAnalysisResponse",
"This cmdlet returns an Amazon.Textract.Model.GetDocumentAnalysisResponse object containing multiple properties. The object can also be referenced from properties attached to the cmdlet entry in the $AWSHistory stack."
)]
public partial class GetTXTDocumentAnalysisCmdlet : AmazonTextractClientCmdlet, IExecutor
{
#region Parameter JobId
/// <summary>
/// <para>
/// A unique identifier for the text-detection job. The <c>JobId</c> is returned
/// from <c>StartDocumentAnalysis</c>. A <c>JobId</c> value is only valid
/// for 7 days.
/// </para>
/// </summary>
#if !MODULAR
[System.Management.Automation.Parameter(Position = 0, ValueFromPipelineByPropertyName = true, ValueFromPipeline = true)]
#else
// Modular builds mark the parameter Mandatory while still letting $null / empty
// strings bind; ProcessRecord emits a warning when $null is bound explicitly.
[System.Management.Automation.Parameter(Position = 0, ValueFromPipelineByPropertyName = true, ValueFromPipeline = true, Mandatory = true)]
[System.Management.Automation.AllowEmptyString]
[System.Management.Automation.AllowNull]
#endif
[Amazon.PowerShell.Common.AWSRequiredParameter]
public System.String JobId { get; set; }
#endregion
#region Parameter MaxResult
/// <summary>
/// <para>
/// The maximum number of results to return per paginated call. The largest value that
/// you can specify is 1,000. If you specify a value greater than 1,000, a maximum of
/// 1,000 results is returned. The default value is 1,000.
/// </para>
/// </summary>
[System.Management.Automation.Parameter(ValueFromPipelineByPropertyName = true)]
[Alias("MaxResults")]
public System.Int32? MaxResult { get; set; }
#endregion
#region Parameter NextToken
/// <summary>
/// <para>
/// If the previous response was incomplete (because there are more blocks to retrieve),
/// Amazon Textract returns a pagination token in the response. You can use this pagination
/// token to retrieve the next set of blocks.
/// </para>
/// <para>
/// Note: In the AWS.Tools.Textract module, this parameter is only used if you are manually controlling output pagination of the service API call.
/// </para>
/// <para>
/// In order to manually control output pagination, use '-NextToken $null' for the first call and '-NextToken $AWSHistory.LastServiceResponse.NextToken' for subsequent calls.
/// </para>
/// </summary>
[System.Management.Automation.Parameter(ValueFromPipelineByPropertyName = true)]
public System.String NextToken { get; set; }
#endregion
#region Parameter Select
/// <summary>
/// Use the -Select parameter to control the cmdlet output. The default value is '*'.
/// Specifying -Select '*' will result in the cmdlet returning the whole service response (Amazon.Textract.Model.GetDocumentAnalysisResponse).
/// Specifying the name of a property of type Amazon.Textract.Model.GetDocumentAnalysisResponse will result in that property being returned.
/// Specifying -Select '^ParameterName' will result in the cmdlet returning the selected cmdlet parameter value.
/// </summary>
[System.Management.Automation.Parameter(ValueFromPipelineByPropertyName = true)]
public string Select { get; set; } = "*";
#endregion
#region Parameter PassThru
/// <summary>
/// Changes the cmdlet behavior to return the value passed to the JobId parameter.
/// The -PassThru parameter is deprecated, use -Select '^JobId' instead. This parameter will be removed in a future version.
/// </summary>
[System.Obsolete("The -PassThru parameter is deprecated, use -Select '^JobId' instead. This parameter will be removed in a future version.")]
[System.Management.Automation.Parameter(ValueFromPipelineByPropertyName = true)]
public SwitchParameter PassThru { get; set; }
#endregion
#region Parameter NoAutoIteration
#if MODULAR
/// <summary>
/// By default the cmdlet will auto-iterate and retrieve all results to the pipeline by performing multiple
/// service calls. If set, the cmdlet will retrieve only the next 'page' of results using the value of NextToken
/// as the start point.
/// </summary>
[System.Management.Automation.Parameter(ValueFromPipelineByPropertyName = true)]
public SwitchParameter NoAutoIteration { get; set; }
#endif
#endregion
/// <summary>
/// Loads the bound parameters into a fresh <c>CmdletContext</c>, runs the service
/// call through <c>Execute</c> and hands whatever it returns to <c>ProcessOutput</c>.
/// </summary>
/// <exception cref="System.ArgumentException">
/// The -Select value could not be turned into a selector, or -Select and -PassThru
/// were both supplied.
/// </exception>
protected override void ProcessRecord()
{
    this._AWSSignerType = "v4";
    base.ProcessRecord();

    var context = new CmdletContext();

    // allow for manipulation of parameters prior to loading into context
    PreExecutionContextLoad(context);

    #pragma warning disable CS0618, CS0612 //A class member was marked with the Obsolete attribute
    if (ParameterWasBound(nameof(this.Select)))
    {
        // The selector is a (response, cmdlet) => object delegate, so the helper has to be
        // told both types explicitly; they cannot be inferred from the string argument.
        // NOTE(review): type arguments restored after being stripped from this file -
        // confirm against the CreateSelectDelegate declaration in the base cmdlet.
        context.Select = CreateSelectDelegate<Amazon.Textract.Model.GetDocumentAnalysisResponse, GetTXTDocumentAnalysisCmdlet>(Select) ??
            throw new System.ArgumentException("Invalid value for -Select parameter.", nameof(this.Select));
        if (this.PassThru.IsPresent)
        {
            throw new System.ArgumentException("-PassThru cannot be used when -Select is specified.", nameof(this.Select));
        }
    }
    else if (this.PassThru.IsPresent)
    {
        // Legacy -PassThru: emit the JobId parameter value rather than the response.
        context.Select = (response, cmdlet) => this.JobId;
    }
    #pragma warning restore CS0618, CS0612 //A class member was marked with the Obsolete attribute

    context.JobId = this.JobId;
    #if MODULAR
    // JobId is flagged as required but still accepts $null; warn rather than fail.
    if (this.JobId == null && ParameterWasBound(nameof(this.JobId)))
    {
        WriteWarning("You are passing $null as a value for parameter JobId which is marked as required. In case you believe this parameter was incorrectly marked as required, report this by opening an issue at https://github.com/aws/aws-tools-for-powershell/issues.");
    }
    #endif
    context.MaxResult = this.MaxResult;
    context.NextToken = this.NextToken;

    // allow further manipulation of loaded context prior to processing
    PostExecutionContextLoad(context);

    var output = Execute(context) as CmdletOutput;
    ProcessOutput(output);
}
#region IExecutor Members
#if MODULAR
/// <summary>
/// Modular-build executor: calls GetDocumentAnalysis repeatedly, passing each page
/// to <c>ProcessOutput</c>, until the service stops returning a NextToken or the
/// caller has taken over pagination.
/// </summary>
/// <param name="context">The <c>CmdletContext</c> populated by <c>ProcessRecord</c>.</param>
/// <returns>
/// Always <c>null</c>; every page (or error) is forwarded to <c>ProcessOutput</c>
/// from inside the loop instead of being returned.
/// </returns>
public object Execute(ExecutorContext context)
{
    var cmdletContext = context as CmdletContext;

    #pragma warning disable CS0618, CS0612 //A class member was marked with the Obsolete attribute
    // '^' is a syntactic marker, not linguistic text, so compare ordinally instead of
    // relying on the current culture's collation rules.
    var useParameterSelect = this.Select.StartsWith("^", StringComparison.Ordinal) || this.PassThru.IsPresent;
    #pragma warning restore CS0618, CS0612 //A class member was marked with the Obsolete attribute

    // create request and set iteration invariants
    var request = new Amazon.Textract.Model.GetDocumentAnalysisRequest();
    if (cmdletContext.JobId != null)
    {
        request.JobId = cmdletContext.JobId;
    }
    if (cmdletContext.MaxResult != null)
    {
        request.MaxResults = cmdletContext.MaxResult.Value;
    }

    // Initialize loop variant and commence piping
    var _nextToken = cmdletContext.NextToken;
    // Only a single page is fetched when the caller asked for -NoAutoIteration or
    // supplied -NextToken explicitly.
    var _userControllingPaging = this.NoAutoIteration.IsPresent || ParameterWasBound(nameof(this.NextToken));

    var client = Client ?? CreateClient(_CurrentCredentials, _RegionEndpoint);
    do
    {
        request.NextToken = _nextToken;

        CmdletOutput output;
        try
        {
            var response = CallAWSServiceOperation(client, request);

            // When a parameter value was selected, nothing derived from the response is
            // piped per page; the parameter value is written once after the loop.
            object pipelineOutput = null;
            if (!useParameterSelect)
            {
                pipelineOutput = cmdletContext.Select(response, this);
            }
            output = new CmdletOutput
            {
                PipelineOutput = pipelineOutput,
                ServiceResponse = response
            };

            _nextToken = response.NextToken;
        }
        catch (Exception e)
        {
            output = new CmdletOutput { ErrorResponse = e };
        }

        ProcessOutput(output);
    } while (!_userControllingPaging && AutoIterationHelpers.HasValue(_nextToken));

    if (useParameterSelect)
    {
        WriteObject(cmdletContext.Select(null, this));
    }

    return null;
}
#else
/// <summary>
/// Monolithic-build executor: issues a single GetDocumentAnalysis call and wraps
/// the outcome in a <c>CmdletOutput</c>.
/// </summary>
/// <param name="context">The <c>CmdletContext</c> populated by <c>ProcessRecord</c>.</param>
/// <returns>
/// A <c>CmdletOutput</c> holding either the service response plus the selected
/// pipeline value, or the exception raised by the call.
/// </returns>
public object Execute(ExecutorContext context)
{
    var cmdletContext = context as CmdletContext;

    // Copy across only the values that were actually supplied.
    var analysisRequest = new Amazon.Textract.Model.GetDocumentAnalysisRequest();
    if (cmdletContext.JobId != null)
    {
        analysisRequest.JobId = cmdletContext.JobId;
    }
    if (cmdletContext.MaxResult.HasValue)
    {
        analysisRequest.MaxResults = cmdletContext.MaxResult.Value;
    }
    if (cmdletContext.NextToken != null)
    {
        analysisRequest.NextToken = cmdletContext.NextToken;
    }

    // Client resolution stays outside the try block so its failures are not
    // converted into an ErrorResponse.
    var textractClient = Client ?? CreateClient(_CurrentCredentials, _RegionEndpoint);

    try
    {
        var serviceResponse = CallAWSServiceOperation(textractClient, analysisRequest);
        object selected = cmdletContext.Select(serviceResponse, this);
        return new CmdletOutput
        {
            PipelineOutput = selected,
            ServiceResponse = serviceResponse
        };
    }
    catch (Exception failure)
    {
        return new CmdletOutput { ErrorResponse = failure };
    }
}
#endif
/// <summary>
/// Creates an empty execution context for this cmdlet.
/// </summary>
/// <returns>A new <c>CmdletContext</c> instance.</returns>
public ExecutorContext CreateContext() => new CmdletContext();
#endregion
#region AWS Service Operation Call
/// <summary>
/// Writes the verbose endpoint message and invokes GetDocumentAnalysis on the
/// supplied client, using the synchronous API on DESKTOP builds and blocking on
/// the async API on CORECLR builds.
/// </summary>
/// <param name="client">Textract client used for the call.</param>
/// <param name="request">Request to send.</param>
/// <returns>The service response.</returns>
/// <exception cref="System.Exception">
/// The service exception wraps a <see cref="System.Net.WebException"/>; it is
/// rethrown with a name-resolution failure message. Other service exceptions
/// propagate unchanged.
/// </exception>
private Amazon.Textract.Model.GetDocumentAnalysisResponse CallAWSServiceOperation(IAmazonTextract client, Amazon.Textract.Model.GetDocumentAnalysisRequest request)
{
    Utils.Common.WriteVerboseEndpointMessage(this, client.Config, "Amazon Textract", "GetDocumentAnalysis");
    try
    {
        #if DESKTOP
        return client.GetDocumentAnalysis(request);
        #elif CORECLR
        return client.GetDocumentAnalysisAsync(request).GetAwaiter().GetResult();
        #else
                #error "Unknown build edition"
        #endif
    }
    catch (AmazonServiceException serviceError)
    {
        // A wrapped WebException gets a friendlier message; anything else is
        // rethrown as-is.
        if (serviceError.InnerException is System.Net.WebException networkError)
        {
            var message = Utils.Common.FormatNameResolutionFailureMessage(client.Config, networkError.Message);
            throw new Exception(message, networkError);
        }

        throw;
    }
}
#endregion
/// <summary>
/// Snapshot of the cmdlet's bound parameter values, plus the selector that turns a
/// service response into pipeline output.
/// </summary>
internal partial class CmdletContext : ExecutorContext
{
    public System.String JobId { get; set; }
    public System.Int32? MaxResult { get; set; }
    public System.String NextToken { get; set; }

    // Invoked as Select(response, cmdlet) with the result stored as object; the
    // default returns the whole response (the -Select '*' behaviour).
    public System.Func<Amazon.Textract.Model.GetDocumentAnalysisResponse, GetTXTDocumentAnalysisCmdlet, object> Select { get; set; } =
        (response, cmdlet) => response;
}
}
}