
Commit 7eb1736

Author: Zhi Zhou (committed)

List all sample code in readme and add shared_functions notebook

1 parent 51c22a8, commit 7eb1736

10 files changed: +663 -651 lines changed

Basic_Samples/GPT-4V/in_context_chatcompletions_example_restapi.ipynb renamed to Basic_Samples/GPT-4V/RAG_chatcompletions_example_restapi.ipynb

Lines changed: 46 additions & 60 deletions
@@ -13,15 +13,15 @@
 },
 {
 "cell_type": "code",
-"execution_count": 1,
+"execution_count": 7,
 "id": "f4b3d21a",
 "metadata": {},
 "outputs": [],
 "source": [
 "import json\n",
 "import os\n",
-"import requests\n",
-"import base64"
+"import base64\n",
+"%run shared_functions.ipynb"
 ]
 },
 {
@@ -32,12 +32,12 @@
 "### Setup Parameters\n",
 "\n",
 "\n",
-"Here we will load the configurations from _config.json_ file to setup search_service_endpoint, search_index_name, search_query_key, deployment_name, openai_api_base, openai_api_key and openai_api_version."
+"Here we will load the configurations from _config.json_ file to setup search_service_endpoint, search_index_name, and search_query_key"
 ]
 },
 {
 "cell_type": "code",
-"execution_count": 2,
+"execution_count": 8,
 "id": "fd85fb30",
 "metadata": {},
 "outputs": [],
@@ -53,71 +53,58 @@
 "search_index_name = config_details['AZURE_SEARCH_INDEX_NAME']\n",
 "\n",
 "# Setting up the Azure Search service query key\n",
-"search_query_key = os.getenv(\"AZURE_SEARCH_QUERY_KEY\")\n",
-"\n",
-"# Setting up the deployment name\n",
-"deployment_name = config_details['GPT-4V_MODEL']\n",
-"\n",
-"# The base URL for your Azure OpenAI resource. e.g. \"https://<your resource name>.openai.azure.com\"\n",
-"openai_api_base = config_details['OPENAI_API_BASE']\n",
-"\n",
-"# The API key for your Azure OpenAI resource.\n",
-"openai_api_key = os.getenv(\"OPENAI_API_KEY\")\n",
-"\n",
-"# Currently OPENAI API have the following versions available: 2022-12-01. All versions follow the YYYY-MM-DD date structure.\n",
-"openai_api_version = config_details['OPENAI_API_VERSION']"
+"search_query_key = os.getenv(\"AZURE_SEARCH_QUERY_KEY\")"
+]
+},
+{
+"cell_type": "markdown",
+"metadata": {},
+"source": [
+"### Create Azure Search Index"
 ]
 },
 {
 "cell_type": "code",
-"execution_count": 3,
+"execution_count": 10,
+"metadata": {},
+"outputs": [],
+"source": [
+"# Using the Azure Search service create the index with image embeddings\n",
+"#https://github.com/Azure/azure-search-vector-samples/blob/main/demo-python/code/azure-search-vector-image-index-creation-python-sample.ipynb"
+]
+},
+{
+"cell_type": "markdown",
+"metadata": {},
+"source": [
+"### Call GPT-4V API with Image"
+]
+},
+{
+"cell_type": "code",
+"execution_count": 9,
 "id": "b6165c63",
 "metadata": {},
 "outputs": [
 {
 "name": "stdout",
 "output_type": "stream",
 "text": [
-"The apple in the image appears to be a Gala apple.\n"
+"Gala\n"
 ]
 }
 ],
 "source": [
-"# Create Azure Search index (the link will be updated once it goes public)\n",
-"# https://github.com/zhizhoualan/cognitive-search-vector-pr/blob/main/demo-python/code/azure-search-vector-image-index-creation-python-sample.ipynb\n",
-"\n",
 "# System messages and user prompt\n",
 "sys_message = \"You are an AI assistant that helps people find information.\"\n",
 "user_prompt = \"What are the types of the apple(s) shown in this image?\"\n",
 "\n",
 "# Encode the image in base64\n",
 "image_file_path = \"../../common/images/test_Gala.jpeg\" # Another example including two apples: \"../../common/images/two_apples.jpeg\".\n",
 "with open(image_file_path, 'rb') as image_file:\n",
-" encoded_image = base64.b64encode(image_file.read()).decode('ascii')\n",
-" \n",
-"# Construct the API request URL\n",
-"api_url = f\"{openai_api_base}/openai/deployments/{deployment_name}/extensions/chat/completions?api-version={openai_api_version}\"\n",
-"\n",
-"# Including the api-key in HTTP headers\n",
-"headers = {\n",
-" \"Content-Type\": \"application/json\",\n",
-" \"api-key\": openai_api_key,\n",
-"}\n",
-"\n",
-"# Payload for the request\n",
-"payload = {\n",
-" \"model\": \"gpt-4-vision-preview\", \n",
-" \"dataSources\": [\n",
-" {\n",
-" \"type\": \"AzureCognitiveSearch\",\n",
-" \"parameters\": {\n",
-" \"endpoint\": search_service_endpoint,\n",
-" \"key\": search_query_key,\n",
-" \"indexName\": search_index_name\n",
-" }\n",
-" }\n",
-" ],\n",
-" \"messages\": [\n",
+" encoded_image = base64.b64encode(image_file.read()).decode('utf-8')\n",
+" \n",
+"messages = [\n",
 " {\n",
 " \"role\": \"system\",\n",
 " \"content\": [\n",
@@ -142,20 +129,19 @@
 " }\n",
 " ]\n",
 " }\n",
-" ],\n",
-" \"temperature\": 0.7,\n",
-" \"top_p\": 0.95,\n",
-" \"max_tokens\": 800\n",
-"}\n",
+" ]\n",
+"\n",
+"in_context_config = {\n",
+" 'endpoint': search_service_endpoint,\n",
+" 'key': search_query_key,\n",
+" 'indexName': search_index_name\n",
+"} \n",
 "\n",
-"# Send the request and handle the response\n",
 "try:\n",
-" response = requests.post(api_url, headers=headers, json=payload)\n",
-" response.raise_for_status() # Raise an error for bad HTTP status codes\n",
-" response_content = response.json()\n",
-" print(response_content['choices'][0]['message']['content'])\n",
-"except requests.RequestException as e:\n",
-" raise SystemExit(f\"Failed to make the request. Error: {e}\")"
+" response_content = call_GPT4V_image(messages, in_context=in_context_config)\n",
+" print(response_content['choices'][0]['message']['content']) # Print the content of the response\n",
+" except Exception as e:\n",
+" raise SystemExit(f\"Failed to call GPT-4V API. Error: {e}\")"
 ]
 }
 ],
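Note: the `call_GPT4V_image` helper that the refactored notebooks now rely on lives in the new shared_functions.ipynb, which is not included in this excerpt of the commit. Based on the inline REST code removed above (endpoint construction, the `api-key` header, and the optional `dataSources` entry for Azure Cognitive Search) and on the new call sites, a minimal sketch of such a helper might look like the following; the function name and the `in_context` keyword come from the call sites, while the config loading and the request defaults are assumptions carried over from the deleted code.

```python
import json
import os
import requests

# Assumed helper, reconstructed from the inline REST code this commit removes.
# The real shared_functions.ipynb may differ in names and defaults.
def call_GPT4V_image(messages, in_context=None):
    # Load endpoint and deployment settings the same way the notebooks do.
    with open("config.json") as config_file:
        config = json.load(config_file)

    openai_api_base = config["OPENAI_API_BASE"]
    deployment_name = config["GPT-4V_MODEL"]
    openai_api_version = config["OPENAI_API_VERSION"]
    openai_api_key = os.getenv("OPENAI_API_KEY")

    headers = {"Content-Type": "application/json", "api-key": openai_api_key}
    payload = {"messages": messages, "temperature": 0.7, "top_p": 0.95, "max_tokens": 800}

    if in_context:
        # RAG path: route through the extensions endpoint with an Azure Cognitive Search data source.
        api_url = (f"{openai_api_base}/openai/deployments/{deployment_name}"
                   f"/extensions/chat/completions?api-version={openai_api_version}")
        payload["dataSources"] = [{"type": "AzureCognitiveSearch", "parameters": in_context}]
    else:
        # Plain image chat completions endpoint used by the basic sample.
        api_url = (f"{openai_api_base}/openai/deployments/{deployment_name}"
                   f"/chat/completions?api-version={openai_api_version}")

    response = requests.post(api_url, headers=headers, json=payload)
    response.raise_for_status()  # Surface bad HTTP status codes to the caller's try/except
    return response.json()
```

With a helper shaped like this, the basic notebook calls `call_GPT4V_image(messages)` and the RAG notebook passes the search settings via `in_context`, which matches the two call sites visible in this commit.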

Basic_Samples/GPT-4V/README.md

Lines changed: 30 additions & 3 deletions
@@ -1,7 +1,19 @@
 
 # Introduction
 
-This repository contains samples demonstrating how to use GPT-4V for Chat Completions via REST API.
+This repository contains a collection of Jupyter notebooks demonstrating various use cases for interacting with the GPT-4V API, along with samples demonstrating how to use GPT-4V for Chat Completions via REST API. These examples provide practical guidance and accelerators for developers integrating GPT-4V functionalities in their applications.
+
+## Contents
+| Notebook | Description | Type |
+|----------|-------------|-------|
+| [Basic Image in GPT-4V](basic_chatcompletions_example_restapi.ipynb) | Processing a single image input with GPT-4V. | Image |
+| [Handling Multiple Images in GPT-4V](mutiple_images_chatcompletions_example_restapi.ipynb) | Managing multiple image inputs in GPT-4V. | Image |
+| [Enhancing GPT-4V with RAG and Custom Data](RAG_chatcompletions_example_restapi.ipynb) | Enhancing capabilities by bringing custom data to augment image inputs in GPT-4V. | Image |
+| [Enhancing GPT-4V with Grounding Techniques](enhancement_grounding_chatcompletions_example_restapi.ipynb) | Applying grounding techniques to image inputs in GPT-4V. | Image |
+| [Enhancing GPT-4V with OCR Technique](enhancement_OCR_chatcompletions_example_restapi.ipynb) | Incorporating Optical Character Recognition (OCR) with image inputs in GPT-4V. | Image |
+| [Basic Video QnA in GPT-4V](video_chatcompletions_example_restapi.ipynb) | Conducting Q&A with video inputs in GPT-4V. | Video |
+| [Video Chunk Processing Sequentially in GPT-4V](video_chunk_chatcompletions_example_restapi.ipynb) | Sequential processing of video chunks in GPT-4V. | Video |
+
 
 ## Installation
 Install all Python modules and packages listed in the requirements.txt file using the below command.
@@ -11,7 +23,7 @@ pip install -r requirements.txt
 ```
 
 ### Microsoft Azure Endpoints
-In order to use REST API with Microsoft Azure endpoints, you need to set GPT-4V_MODEL, OPENAI_API_BASE, OPENAI_API_VERSION & VISION_API_ENDPOINT in _config.json_ file.
+In order to use REST API with Microsoft Azure endpoints, you need to set a series of configurations such as GPT-4V_MODEL, OPENAI_API_BASE, OPENAI_API_VERSION & VISION_API_ENDPOINT in _config.json_ file.
 
 ```js
 {
@@ -20,6 +32,13 @@ In order to use REST API with Microsoft Azure endpoints, you need to set GPT-4V_
 "OPENAI_API_VERSION":"<OpenAI API Version>",
 
 "VISION_API_ENDPOINT": "https://<Your Azure Vision Resource Name>.cognitiveservices.azure.com"
+
+"AZURE_SEARCH_SERVICE_ENDPOINT": "https://<Your Azure Search Resource Name>.search.windows.net",
+"AZURE_SEARCH_INDEX_NAME": "<Your Azure Search Index Name>",
+
+"VIDEO_SAS_URL": "<Your Azure Blob Storage SAS URL>",
+"VIDEO_INDEX_NAME": "<Your Azure Video Index Name>",
+"VIDEO_INDEX_ID": "<Your Azure Video Index ID>"
 }
 ```
 
@@ -46,7 +65,15 @@ Learn more about Azure OpenAI Service REST API [here](https://learn.microsoft.co
 Python 3.8+ <br>
 Jupyter Notebook 6.5.2
 
-<br>
+
+## Usage
+
+Each notebook is self-contained and includes instructions specific to its scenario. Simply open a notebook in Jupyter and follow the steps outlined within it.
+
+## Shared Functions
+
+For convenience, commonly used functions across these notebooks are consolidated in [shared_functions.ipynb](shared_functions.ipynb). Import these functions in any notebook as needed.
+
 
 ## Trademarks
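The new Usage and Shared Functions sections describe the pattern the notebook diffs in this commit follow: pull the helpers in with `%run shared_functions.ipynb`, build a `messages` list, and call the shared function. A condensed sketch of that flow is below; the image path and prompts are taken from the basic sample, while the exact layout of the user message is an assumption (the diff hunks elide the middle of the `messages` list), modeled on the usual GPT-4 with Vision content format.

```python
# Inside a sample notebook cell, after config.json has been filled in as described above.
%run shared_functions.ipynb   # defines call_GPT4V_image (and other shared helpers)

import base64

# Encode the sample image shipped with the repo.
with open("../../common/images/test_Gala.jpeg", "rb") as image_file:
    encoded_image = base64.b64encode(image_file.read()).decode("utf-8")

# Assumed message layout: a system text part plus a user turn mixing text and a base64 image.
messages = [
    {"role": "system", "content": [
        {"type": "text", "text": "You are an AI assistant that helps people find information."},
    ]},
    {"role": "user", "content": [
        {"type": "text", "text": "What are the types of the apple(s) shown in this image?"},
        {"type": "image_url", "image_url": {"url": f"data:image/jpeg;base64,{encoded_image}"}},
    ]},
]

response_content = call_GPT4V_image(messages)
print(response_content["choices"][0]["message"]["content"])
```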

Basic_Samples/GPT-4V/basic_chatcompletions_example_restapi.ipynb

Lines changed: 23 additions & 84 deletions
@@ -11,57 +11,20 @@
 "# Chat Completions"
 ]
 },
-{
-"cell_type": "code",
-"execution_count": 1,
-"id": "f4b3d21a",
-"metadata": {},
-"outputs": [],
-"source": [
-"import json\n",
-"import os\n",
-"import requests\n",
-"import base64"
-]
-},
-{
-"cell_type": "markdown",
-"id": "5b2d4a0f",
-"metadata": {},
-"source": [
-"### Setup Parameters\n",
-"\n",
-"\n",
-"Here we will load the configurations from _config.json_ file to setup deployment_name, openai_api_base, openai_api_key and openai_api_version."
-]
-},
 {
 "cell_type": "code",
 "execution_count": 2,
-"id": "fd85fb30",
+"id": "f4b3d21a",
 "metadata": {},
 "outputs": [],
 "source": [
-"# Load config values\n",
-"with open(r'config.json') as config_file:\n",
-" config_details = json.load(config_file)\n",
-" \n",
-"# Setting up the deployment name\n",
-"deployment_name = config_details['GPT-4V_MODEL']\n",
-"\n",
-"# The base URL for your Azure OpenAI resource. e.g. \"https://<your resource name>.openai.azure.com\"\n",
-"openai_api_base = config_details['OPENAI_API_BASE']\n",
-"\n",
-"# The API key for your Azure OpenAI resource.\n",
-"openai_api_key = os.getenv(\"OPENAI_API_KEY\")\n",
-"\n",
-"# Currently OPENAI API have the following versions available: 2022-12-01. All versions follow the YYYY-MM-DD date structure.\n",
-"openai_api_version = config_details['OPENAI_API_VERSION']"
+"import base64\n",
+"%run shared_functions.ipynb"
 ]
 },
 {
 "cell_type": "code",
-"execution_count": 3,
+"execution_count": 18,
 "id": "aef62557",
 "metadata": {},
 "outputs": [
@@ -70,25 +33,20 @@
 "output_type": "stream",
 "text": [
 "1. Fresh produce\n",
-"2. Fruits and vegetables\n",
-"3. Colorful food\n",
-"4. Healthy eating\n",
-"5. Organic groceries\n",
-"6. Variety of produce\n",
-"7. Vegetarian ingredients\n",
-"8. Assorted vegetables\n",
-"9. Tropical fruits\n",
-"10. Farm fresh\n",
-"11. Nutrient-rich foods\n",
-"12. Vegan options\n",
-"13. Whole foods\n",
-"14. Raw vegetables\n",
-"15. Fruit assortment\n",
-"16. Market produce\n",
-"17. Dietary fiber sources\n",
-"18. Natural foods\n",
-"19. Agriculture harvest\n",
-"20. Culinary ingredients\n"
+"2. Assorted fruits\n",
+"3. Variety of vegetables\n",
+"4. Healthy food\n",
+"5. Colorful food assortment\n",
+"6. Organic produce\n",
+"7. Raw fruits and vegetables\n",
+"8. Vegan ingredients\n",
+"9. Nutritious diet\n",
+"10. Whole foods\n",
+"11. Farmers market\n",
+"12. Seasonal produce\n",
+"13. Plant-based diet\n",
+"14. Fresh harvest\n",
+"15. Food background\n"
 ]
 }
 ],
@@ -109,19 +67,7 @@
 "with open(image_file_path, 'rb') as image_file:\n",
 " encoded_image = base64.b64encode(image_file.read()).decode('utf-8')\n",
 "\n",
-"# Construct the API request URL\n",
-"api_url = f\"{openai_api_base}/openai/deployments/{deployment_name}/chat/completions?api-version={openai_api_version}\"\n",
-"\n",
-"# Including the api-key in HTTP headers\n",
-"headers = {\n",
-" \"Content-Type\": \"application/json\",\n",
-" \"api-key\": openai_api_key,\n",
-"}\n",
-"\n",
-"# Payload for the request\n",
-"payload = {\n",
-" \"model\": \"gpt-4-vision-preview\",\n",
-" \"messages\": [\n",
+"messages = [\n",
 " {\n",
 " \"role\": \"system\",\n",
 " \"content\": [\n",
@@ -146,20 +92,13 @@
 " }\n",
 " ]\n",
 " }\n",
-" ],\n",
-" \"temperature\": 0.7,\n",
-" \"top_p\": 0.95,\n",
-" \"max_tokens\": 800\n",
-"}\n",
+" ]\n",
 "\n",
-"# Send the request and handle the response\n",
 "try:\n",
-" response = requests.post(api_url, headers=headers, json=payload)\n",
-" response.raise_for_status() # Raise an error for bad HTTP status codes\n",
-" response_content = response.json()\n",
+" response_content = call_GPT4V_image(messages)\n",
 " print(response_content['choices'][0]['message']['content']) # Print the content of the response\n",
-"except requests.RequestException as e:\n",
-" raise SystemExit(f\"Failed to make the request. Error: {e}\")"
+"except Exception as e:\n",
+" raise SystemExit(f\"Failed to call GPT-4V API. Error: {e}\")"
 ]
 }
 ],
