OpenAI on your own data frequently returns "the requested information is not available in the retrieved data"

Antoine DRIARD 0 Reputation points
2024-04-04T21:06:45.1+00:00

Hi,

We are currently developing a new module for our application that requires Azure OpenAI to analyze the content of a CSV file, searching for anomalies (unexpected data, possible entry errors).

When it works, it works pretty well.

But very frequently, we get this error message: "the requested information is not available in the retrieved data". When we try again a few seconds later, sometimes it works well, sometimes we get the error again. It is highly unpredictable.

Our sequence of operations is:

  • upload a csv file as azure blob
  • create an index
  • create a data source
  • create an indexer
  • wait until the indexer has run
  • wait until the index stats show 1 document indexed
  • set the OpenAI settings
  • send the openAI prompt (system and user)

Here is our config:

Tenant on "France Central" for OpenAI and AISearch

AISearch

  • standard tier
  • indexer: config data below
  • index: config data below
  • datasource : config data below

OpenAI

  • configuration data below (serialized by us into JSON)

Azure.AI.OpenAI NuGet package updated to latest version

deployment with gpt4 32k

thanks for your help, greatly appreciated.

Antoine


config information below:

Indexer definition:

{

"@odata.context": "https://search-XXXXXXXXXXXXXX-beta-fc-2.search.windows.net/$metadata#indexers/$entity",

"@odata.etag": ""0x8DC54C2DA1745EE"",

"name": "indexer-6192915d50c342408e65feacc31c6902",

"description": null,

"dataSourceName": "ds-6192915d50c342408e65feacc31c6902",

"skillsetName": null,

"targetIndexName": "index-6192915d50c342408e65feacc31c6902",

"disabled": null,

"schedule": null,

"parameters": {

"batchSize": null,

"maxFailedItems": null,

"maxFailedItemsPerBatch": null

},

"fieldMappings": [],

"outputFieldMappings": [],

"cache": null,

"encryptionKey": null

}

Index definition:

{

"@odata.context": "https://search-XXXXXXXXX-beta-fc-2.search.windows.net/$metadata#indexes/$entity",

"@odata.etag": ""0x8DC54C2D6B96CD2"",

"name": "index-6192915d50c342408e65feacc31c6902",

"defaultScoringProfile": null,

"fields": [

{

  "name": "content",

  "type": "Edm.String",

  "searchable": true,

  "filterable": false,

  "retrievable": true,

  "stored": true,

  "sortable": false,

  "facetable": false,

  "key": false,

  "indexAnalyzer": null,

  "searchAnalyzer": null,

  "analyzer": null,

  "normalizer": null,

  "dimensions": null,

  "vectorSearchProfile": null,

  "synonymMaps": []

},

{

  "name": "title",

  "type": "Edm.String",

  "searchable": true,

  "filterable": false,

  "retrievable": true,

  "stored": true,

  "sortable": false,

  "facetable": false,

  "key": false,

  "indexAnalyzer": null,

  "searchAnalyzer": null,

  "analyzer": null,

  "normalizer": null,

  "dimensions": null,

  "vectorSearchProfile": null,

  "synonymMaps": []

},

{

  "name": "description",

  "type": "Edm.String",

  "searchable": true,

  "filterable": false,

  "retrievable": true,

  "stored": true,

  "sortable": false,

  "facetable": false,

  "key": false,

  "indexAnalyzer": null,

  "searchAnalyzer": null,

  "analyzer": null,

  "normalizer": null,

  "dimensions": null,

  "vectorSearchProfile": null,

  "synonymMaps": []

},

{

  "name": "id",

  "type": "Edm.String",

  "searchable": false,

  "filterable": true,

  "retrievable": true,

  "stored": true,

  "sortable": true,

  "facetable": true,

  "key": true,

  "indexAnalyzer": null,

  "searchAnalyzer": null,

  "analyzer": null,

  "normalizer": null,

  "dimensions": null,

  "vectorSearchProfile": null,

  "synonymMaps": []

}

],

"scoringProfiles": [],

"corsOptions": null,

"suggesters": [],

"analyzers": [],

"normalizers": [],

"tokenizers": [],

"tokenFilters": [],

"charFilters": [],

"encryptionKey": null,

"similarity": {

"@odata.type": "#Microsoft.Azure.Search.BM25Similarity",

"k1": null,

"b": null

},

"semantic": {

"defaultConfiguration": null,

"configurations": [

  {

    "name": "default",

    "prioritizedFields": {

      "titleField": {

        "fieldName": "title"

      },

      "prioritizedContentFields": [

        {

          "fieldName": "content"

        },

        {

          "fieldName": "description"

        }

      ],

      "prioritizedKeywordsFields": []

    }

  }

]

},

"vectorSearch": null

}

Data source:

{

"@odata.context": "https://search-XXXXXXXXX-beta-fc-2.search.windows.net/$metadata#datasources/$entity",

"@odata.etag": ""0x8DC54C2D6CF7424"",

"name": "ds-6192915d50c342408e65feacc31c6902",

"description": null,

"type": "azureblob",

"subtype": null,

"credentials": {

"connectionString": "DefaultEndpointsProtocol=https;AccountName=stXXXXXXbeta;AccountKey=..."

},

"container": {

"name": "analysis",

"query": "Job-6192915d50c342408e65feacc31c6902/"

},

"dataChangeDetectionPolicy": null,

"dataDeletionDetectionPolicy": null,

"encryptionKey": null,

"identity": null

}

OpenAI configuration

{

"ChoiceCount": null,

"DeploymentName": "md-gpt-4-32k-XXXXXX-fc",

"FrequencyPenalty": 0.0,

"MaxTokens": 8000,

"NucleusSamplingFactor": null,

"PresencePenalty": 0.0,

"StopSequences": [],

"Temperature": 0.7,

"TokenSelectionBiases": {},

"Functions": [],

"FunctionCall": null,

"AzureExtensionsOptions": {

    "Extensions": [{

        "Authentication": {

            "Key": "Our Key"

        },

        "DocumentCount": null,

        "ShouldRestrictResultScope": true,

        "Strictness": 1,

        "RoleInformation": null,

        "SearchEndpoint": "https://search-XXXXXX-beta-fc-2.search.windows.net",

        "IndexName": "index-6192915d50c342408e65feacc31c6902",

        "FieldMappingOptions": {

            "TitleFieldName": "title",

            "UrlFieldName": null,

            "FilepathFieldName": null,

            "ContentFieldNames": ["content", "description"],

            "ContentFieldSeparator": null,

            "VectorFieldNames": [],

            "ImageVectorFieldNames": []

        },

        "QueryType": null,

        "SemanticConfiguration": null,

        "Filter": null,

        "VectorizationSource": null

    }],

    "EnhancementOptions": null

},

"ToolChoice": null,

"Messages": [{

    "Content": "Our system prompt",

    "Name": null,

    "Role": {}

}, {

    "Content": "Our user prompt",

    "MultimodalContentItems": null,

    "Name": null,

    "Role": {}

}],

"User": null,

"Seed": null,

"EnableLogProbabilities": null,

"LogProbabilitiesPerToken": null,

"ResponseFormat": null,

"Tools": []

}

Azure AI Search
Azure AI Search
An Azure search service with built-in artificial intelligence capabilities that enrich information to help identify and explore relevant content at scale.
992 questions
Azure OpenAI Service
Azure OpenAI Service
An Azure service that provides access to OpenAI’s GPT-3 models with enterprise capabilities.
3,040 questions
{count} votes

1 answer

Sort by: Most helpful
  1. Deleted

    This answer has been deleted due to a violation of our Code of Conduct. The answer was manually reported or identified through automated detection before action was taken. Please refer to our Code of Conduct for more information.


    Comments have been turned off. Learn more

Your answer

Answers can be marked as Accepted Answers by the question author, which helps users to know the answer solved the author's problem.