Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

Update VideoAnalyzer #35

Merged
merged 1 commit into from
Apr 21, 2024
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
8 changes: 8 additions & 0 deletions infra/main.tf
Original file line number Diff line number Diff line change
Expand Up @@ -24,6 +24,7 @@ locals {
ca_prep_docs_name = "${var.ca_prep_docs_name}${local.name_sufix}"
ca_aihub_name = "${var.ca_aihub_name}${local.name_sufix}"
func_name = "plugin${local.sufix}"
cv_name = "${var.cv_name}${local.name_sufix}"
}

resource "azurerm_resource_group" "rg" {
Expand Down Expand Up @@ -245,3 +246,10 @@ module "plugin" {
openai_model = module.openai.gpt_deployment_name
openai_endpoint = module.openai.openai_endpoint
}

module "cv" {
source = "./modules/cv"
location = azurerm_resource_group.rg.location
resource_group_name = azurerm_resource_group.rg.name
cv_name = local.cv_name
}
7 changes: 7 additions & 0 deletions infra/modules/cv/main.tf
Original file line number Diff line number Diff line change
@@ -0,0 +1,7 @@
resource "azurerm_cognitive_account" "cv" {
name = var.cv_name
location = var.location
resource_group_name = var.resource_group_name
kind = "Face"
sku_name = "S0"
}
Empty file added infra/modules/cv/outputs.tf
Empty file.
3 changes: 3 additions & 0 deletions infra/modules/cv/variables.tf
Original file line number Diff line number Diff line change
@@ -0,0 +1,3 @@
variable "resource_group_name" {}
variable "location" {}
variable "cv_name" {}
6 changes: 6 additions & 0 deletions infra/modules/st/main.tf
Original file line number Diff line number Diff line change
Expand Up @@ -41,6 +41,12 @@ resource "azurerm_storage_container" "image-analyzer" {
storage_account_name = azurerm_storage_account.sa.name
}

resource "azurerm_storage_container" "image-analyzer" {
name = "video-analyzer"
container_access_type = "private"
storage_account_name = azurerm_storage_account.sa.name
}

resource "azurerm_storage_container" "image-moderator" {
name = "image-moderator"
container_access_type = "private"
Expand Down
4 changes: 4 additions & 0 deletions infra/variables.tf
Original file line number Diff line number Diff line change
Expand Up @@ -86,6 +86,10 @@ variable "ca_aihub_name" {
default = "ca-aihub"
}

variable "cv_name" {
default = "cv-aihub"
}

variable "ca_chat_image" {
default = "ghcr.io/azure/activate-genai/aihub-chat:1.0.0-preview.0"
}
Expand Down
29 changes: 17 additions & 12 deletions src/AIHub/Controllers/VideoAnalyzerController.cs
Original file line number Diff line number Diff line change
Expand Up @@ -26,6 +26,8 @@ public class VideoAnalyzerController : Controller
private VideoAnalyzerModel model;
private HttpClient httpClient;



public VideoAnalyzerController(IConfiguration config, IHttpClientFactory clientFactory)
{
AOAIendpoint = config.GetValue<string>("VideoAnalyzer:OpenAIEndpoint") ?? throw new ArgumentNullException("OpenAIEndpoint");
Expand Down Expand Up @@ -117,9 +119,6 @@ public async Task<IActionResult> DenseCaptionVideo(string video_url, string prom
string VISION_API_ENDPOINT = $"{Visionendpoint}computervision";
string VISION_API_KEY = VisionKey;
string VIDEO_INDEX_NAME = Regex.Replace(video_url.Split("/").Last().Split(".").First().GetHashCode().ToString(), "[^a-zA-Z0-9]", "");



string VIDEO_FILE_SAS_URL = video_url + sasUri.Query;

// Step 1: Create an Index
Expand Down Expand Up @@ -149,6 +148,7 @@ public async Task<IActionResult> DenseCaptionVideo(string video_url, string prom
}
var payload = new
{
model = "gpt-4-vision-preview",
dataSources = new[]
{
new
Expand All @@ -157,8 +157,8 @@ public async Task<IActionResult> DenseCaptionVideo(string video_url, string prom
parameters = new
{
computerVisionBaseUrl = VISION_API_ENDPOINT,
computerVisionApiKey = VisionKey,
indexName = Regex.Replace(video_url.Split("/").Last().Split(".").First().GetHashCode().ToString(), "[^a-zA-Z0-9]", ""),
computerVisionApiKey = VISION_API_KEY,
indexName = VIDEO_INDEX_NAME,
videoUrls = new[] { VIDEO_FILE_SAS_URL }
}
}
Expand All @@ -180,26 +180,31 @@ public async Task<IActionResult> DenseCaptionVideo(string video_url, string prom
role = "user",
content = new object[]
{
new acvDocumentIdWrapper() {AcvDocumentId = VIDEO_DOCUMENT_ID},
prompt
new {
type = "acv_document_id",
acv_document_id = VIDEO_DOCUMENT_ID
},
new {
type = "text",
text = prompt
}
},
}
},
temperature = 0.7,
top_p = 0.95,
max_tokens = 800
max_tokens = 4096
};

try
{
var chatResponse = await httpClient.PostAsync(GPT4V_ENDPOINT, new StringContent(JsonSerializer.Serialize(payload), Encoding.UTF8, "application/json"));
chatResponse.EnsureSuccessStatusCode();
var responseContent = JsonSerializer.Deserialize<dynamic>(await chatResponse.Content.ReadAsStringAsync());
var responseContent = JsonSerializer.Deserialize<JsonObject>(await chatResponse.Content.ReadAsStringAsync());
Console.WriteLine(responseContent);

model.Message = responseContent; //responseContent!.choices[0].message.content;
model.Message = responseContent?["choices"]?[0]?["message"]?["content"]?.ToString();
model.Video = VIDEO_FILE_SAS_URL;

}
catch
{
Expand Down
4 changes: 3 additions & 1 deletion src/AIHub/Views/VideoAnalyzer/VideoAnalyzer.cshtml
Original file line number Diff line number Diff line change
Expand Up @@ -102,7 +102,9 @@
<div class="row g-0 align-items-center">
<div class="col-md-4">
<div class="ratio ratio-16x9">
<iframe id="bigpic" src="@Model.Video"></iframe>
<video id="bigpic" width="320" height="240" controls>
<!--- Here we have to insert the source video throught javascript -->
</video>
</div>
</div>
<div class="col-md-8">
Expand Down
4 changes: 2 additions & 2 deletions src/AIHub/appsettings.template.json
Original file line number Diff line number Diff line change
Expand Up @@ -37,9 +37,9 @@
"VideoAnalyzer": {
"OpenAIEndpoint": "<AOAI EndPoint>",
"GPT4Vision": "openai/deployments/<deploymentName>/extensions/chat/completions?api-version=2023-07-01-preview",
"VisionAPI": "https://<deploymentName>.cognitiveservices.azure.com/",
"VisionKey": "<Vision Key>",
"OpenAISubscriptionKey": "<AOAI Key>",
"VisionEndpoint": "https://<deploymentName>.cognitiveservices.azure.com/",
"VisionSubscriptionKey": "<Vision Key>",
"ContainerName": "video-analyzer",
"DeploymentName": "gpt4-vision"
},
Expand Down
24 changes: 17 additions & 7 deletions src/AIHub/wwwroot/js/ui/videoanalyzer.js
Original file line number Diff line number Diff line change
@@ -1,30 +1,40 @@
Dropzone.options.dropaiimage = {
paramName: "videoFile",
Dropzone.options.dropaiimage = {
paramName: "videoFile",
maxFilesize: 200, // MB
createImageThumbnails:true,
previewsContainer: "#file-previews",
accept: function(file, done) {
done();
},
init: function() {
init: function() {
var myDropzone = this;
myDropzone.on("sending", function(file) {
myDropzone.on("sending", function(file) {
$("#loader").removeClass("d-none");
});
myDropzone.on("complete",
myDropzone.on("complete",
function(file) {
$("#loader").addClass("d-none");
});
},
success: function (file, response) {
if (typeof response === "object") {
$("#show-message-result").text(response.message);
$("#bigpic").attr('src', response.video);

var isrc = document.createElement("source");
isrc.setAttribute("src", response.video);
isrc.setAttribute("type", "video/mp4");
document.getElementById("bigpic").appendChild(isrc);

} else {
try {
var parsedResponse = JSON.parse(response);
$("#show-message-result").val(parsedResponse.message);
$("#bigpic").attr('src',parsedResponse.video);

var isrc = document.createElement("source");
isrc.setAttribute("src", parsedResponse.video);
isrc.setAttribute("type", "video/mp4");
document.getElementById("bigpic").appendChild(isrc);

} catch (e) {
console.error("Error parsing the response:", e);
}
Expand Down
Loading