mirror of
https://github.com/microsoft/autogen.git
synced 2025-08-31 03:49:56 +00:00

* update readme * update * update * update * update * update * update * add sample project * revert notebook change back * update * update interactive version * add nuget package * refactor Message * update example * add azure nightly build pipeline * Set up CI with Azure Pipelines [skip ci] * Update nightly-build.yml for Azure Pipelines * add dotnet interactive package * add dotnet interactive package * update pipeline * add nuget feed back * remove dotnet-tool feed * remove dotnet-tool feed comment * update pipeline * update build name * Update nightly-build.yml * Delete .github/workflows/dotnet-ci.yml * update * add working_dir to use step * add initateChat api * update oai package * Update dotnet-build.yml * Update dotnet-run-openai-test-and-notebooks.yml * update build workflow * update build workflow * update nuget feed * update nuget feed * update aoai and sk version * Update InteractiveService.cs * add support for GPT 4V * add DalleAndGPT4V example * update example * add user proxy agent * add readme * bump version * update example * add dotnet interactive hook * update * udpate tests * add website * update index.md * add docs * update doc * move sk dependency out of core package * udpate doc * Update Use-function-call.md * add type safe function call document * update doc * update doc * add dock * Update Use-function-call.md * add GenerateReplyOptions * remove IChatLLM * update version * update doc * update website * add sample * fix link * add middleware agent * clean up doc * bump version * update doc * update * add Other Language * remove warnings * add sign.props * add sign step * fix pipelien * auth * real sign * disable PR trigger * update * disable PR trigger * use microbuild machine * update build pipeline to add publish to internal feed * add internal feed * fix build pipeline * add dotnet prefix * update ci * add build number * update run number * update source * update token * update * remove adding source * add publish to github package * try again * try again * ask for write pacakge * disable package when branch is not main * update * implement streaming agent * add test for streaming function call * update * fix #1588 * enable PR check for dotnet branch * add website readme * only publish to dotnet feed when pushing to dotnet branch * remove openai-test-and-notebooks workflow * update readme * update readme * update workflow * update getting-start * upgrade test and sample proejct to use .net 8 * fix global.json format && make loadFromConfig API internal only before implementing * update * add support for LM studio * add doc * Update README.md * add push and workflow_dispatch trigger * disable PR for main * add dotnet env * Update Installation.md * add nuget * refer to newtonsoft 13 * update branch to dotnet in docfx * Update Installation.md * pull out HumanInputMiddleware and FunctionCallMiddleware * fix tests * add link to sample folder * refactor message * refactor over IMessage * add more tests * add more test * fix build error * rename header * add semantic kernel project * update sk example * update dotnet version * add LMStudio function call example * rename LLaMAFunctin * remove dotnet run openai test and notebook workflow * add FunctionContract and test * update doc * add documents * add workflow * update * update sample * fix warning in test * reult length can be less then maximumOutputToKeep (#1804) * merge with main * add option to retrieve inner agent and middlewares from MiddlewareAgent * update doc * adjust namespace * update readme * fix test * use IMessage * more updates * update * fix test * add comments * use FunctionContract to replace FunctionDefinition * move AutoGen contrac to AutoGen.Core * update installation * refactor streamingAgent by adding StreamingMessage type * update sample * update samples * update * update * add test * fix test * bump version * add openaichat test * update * Update Example03_Agent_FunctionCall.cs * [.Net] improve docs (#1862) * add doc * add doc * add doc * add doc * add doc * add doc * update * fix test error * fix some error * fix test * fix test * add more tests * edits --------- Co-authored-by: ekzhu <ekzhu@users.noreply.github.com> * [.Net] Add fill form example (#1911) * add form filler example * update * fix ci error * [.Net] Add using AutoGen.Core in source generator (#1983) * fix using namespace bug in source generator * remove using in sourcegenerator test * disable PR test * Add .idea to .gitignore (#1988) * [.Net] publish to nuget.org feed (#1987) * publish to nuget * update ci * update dotnet-release * update release pipeline * add source * remove empty symbol package * update pipeline * remove tag * update installation guide * [.Net] Rename some classes && APIs based on doc review (#1980) * rename sequential group chat to round robin group chat * rename to sendInstruction * rename workflow to graph * rename some api * bump version * move Graph to GroupChat folder * rename fill application example * [.Net] Improve package description (#2161) * add discord link and update package description * Update getting-start.md * [.Net] Fix document comment from the most recent AutoGen.Net engineer sync (#2231) * update * rename RegisterPrintMessageHook to RegisterPrintMessage * update website * update update.md * fix link error * [.Net] Enable JsonMode and deterministic output in AutoGen.OpenAI OpenAIChatAgent (#2347) * update openai version && add sample for json output * add example in web * update update.md * update image url * [.Net] Add AutoGen.Mistral package (#2330) * add mstral client * enable streaming support * add mistralClientAgent * add test for function call * add extension * add support for toolcall and toolcall result message * add support for aggregate message * implement streaming function call * track (#2471) * [.Net] add mistral example (#2482) * update existing examples to use messageCOnnector * add overview * add function call document * add example 14 * add mistral token count usage example * update version * Update dotnet-release.yml (#2488) * update * revert gitattributes --------- Co-authored-by: mhensen <mh@webvize.nl> Co-authored-by: ekzhu <ekzhu@users.noreply.github.com> Co-authored-by: Krzysztof Kasprowicz <60486987+Krzysztof318@users.noreply.github.com>
153 lines
6.0 KiB
C#
153 lines
6.0 KiB
C#
// Copyright (c) Microsoft Corporation. All rights reserved.
|
|
// Example05_Dalle_And_GPT4V.cs
|
|
|
|
using AutoGen;
|
|
using AutoGen.Core;
|
|
using Azure.AI.OpenAI;
|
|
using FluentAssertions;
|
|
using autogen = AutoGen.LLMConfigAPI;
|
|
|
|
public partial class Example05_Dalle_And_GPT4V
|
|
{
|
|
private readonly OpenAIClient openAIClient;
|
|
|
|
public Example05_Dalle_And_GPT4V(OpenAIClient openAIClient)
|
|
{
|
|
this.openAIClient = openAIClient;
|
|
}
|
|
|
|
/// <summary>
|
|
/// Generate image from prompt using DALL-E.
|
|
/// </summary>
|
|
/// <param name="prompt">prompt with feedback</param>
|
|
/// <returns></returns>
|
|
[Function]
|
|
public async Task<string> GenerateImage(string prompt)
|
|
{
|
|
// TODO
|
|
// generate image from prompt using DALL-E
|
|
// and return url.
|
|
var option = new ImageGenerationOptions
|
|
{
|
|
Size = ImageSize.Size1024x1024,
|
|
Style = ImageGenerationStyle.Vivid,
|
|
ImageCount = 1,
|
|
Prompt = prompt,
|
|
Quality = ImageGenerationQuality.Standard,
|
|
DeploymentName = "dall-e-3",
|
|
};
|
|
|
|
var imageResponse = await openAIClient.GetImageGenerationsAsync(option);
|
|
var imageUrl = imageResponse.Value.Data.First().Url.OriginalString;
|
|
|
|
return $@"// ignore this line [IMAGE_GENERATION]
|
|
The image is generated from prompt {prompt}
|
|
|
|
{imageUrl}";
|
|
}
|
|
|
|
public static async Task RunAsync()
|
|
{
|
|
// This example shows how to use DALL-E and GPT-4V to generate image from prompt and feedback.
|
|
// The DALL-E agent will generate image from prompt.
|
|
// The GPT-4V agent will provide feedback to DALL-E agent to help it generate better image.
|
|
// The conversation will be terminated when the image satisfies the condition.
|
|
// The image will be saved to image.jpg in current directory.
|
|
|
|
// get OpenAI Key and create config
|
|
var openAIKey = Environment.GetEnvironmentVariable("OPENAI_API_KEY") ?? throw new Exception("Please set OPENAI_API_KEY environment variable.");
|
|
var gpt35Config = autogen.GetOpenAIConfigList(openAIKey, new[] { "gpt-3.5-turbo" });
|
|
var gpt4vConfig = autogen.GetOpenAIConfigList(openAIKey, new[] { "gpt-4-vision-preview" });
|
|
var openAIClient = new OpenAIClient(openAIKey);
|
|
var instance = new Example05_Dalle_And_GPT4V(openAIClient);
|
|
var imagePath = Path.Combine(Environment.CurrentDirectory, "image.jpg");
|
|
if (File.Exists(imagePath))
|
|
{
|
|
File.Delete(imagePath);
|
|
}
|
|
|
|
var dalleAgent = new AssistantAgent(
|
|
name: "dalle",
|
|
systemMessage: "You are a DALL-E agent that generate image from prompt, when conversation is terminated, return the most recent image url",
|
|
llmConfig: new ConversableAgentConfig
|
|
{
|
|
Temperature = 0,
|
|
ConfigList = gpt35Config,
|
|
FunctionContracts = new[]
|
|
{
|
|
instance.GenerateImageFunctionContract,
|
|
},
|
|
},
|
|
functionMap: new Dictionary<string, Func<string, Task<string>>>
|
|
{
|
|
{ nameof(GenerateImage), instance.GenerateImageWrapper },
|
|
})
|
|
.RegisterMiddleware(async (msgs, option, agent, ct) =>
|
|
{
|
|
// if last message contains [TERMINATE], then find the last image url and terminate the conversation
|
|
if (msgs.Last().GetContent()?.Contains("TERMINATE") is true)
|
|
{
|
|
var lastMessageWithImage = msgs.Last(msg => msg is ImageMessage) as ImageMessage;
|
|
var lastImageUrl = lastMessageWithImage.Url;
|
|
Console.WriteLine($"download image from {lastImageUrl} to {imagePath}");
|
|
var httpClient = new HttpClient();
|
|
var imageBytes = await httpClient.GetByteArrayAsync(lastImageUrl);
|
|
File.WriteAllBytes(imagePath, imageBytes);
|
|
|
|
var messageContent = $@"{GroupChatExtension.TERMINATE}
|
|
|
|
{lastImageUrl}";
|
|
return new TextMessage(Role.Assistant, messageContent)
|
|
{
|
|
From = "dalle",
|
|
};
|
|
}
|
|
|
|
var reply = await agent.GenerateReplyAsync(msgs, option, ct);
|
|
|
|
if (reply.GetContent() is string content && content.Contains("IMAGE_GENERATION"))
|
|
{
|
|
var imageUrl = content.Split("\n").Last();
|
|
var imageMessage = new ImageMessage(Role.Assistant, imageUrl, from: reply.From);
|
|
|
|
return imageMessage;
|
|
}
|
|
else
|
|
{
|
|
return reply;
|
|
}
|
|
})
|
|
.RegisterPrintMessage();
|
|
|
|
var gpt4VAgent = new AssistantAgent(
|
|
name: "gpt4v",
|
|
systemMessage: @"You are a critism that provide feedback to DALL-E agent.
|
|
Carefully check the image generated by DALL-E agent and provide feedback.
|
|
If the image satisfies the condition, then terminate the conversation by saying [TERMINATE].
|
|
Otherwise, provide detailed feedback to DALL-E agent so it can generate better image.
|
|
|
|
The image should satisfy the following conditions:
|
|
- There should be a cat and a mouse in the image
|
|
- The cat should be chasing after the mouse
|
|
",
|
|
llmConfig: new ConversableAgentConfig
|
|
{
|
|
Temperature = 0,
|
|
ConfigList = gpt4vConfig,
|
|
})
|
|
.RegisterPrintMessage();
|
|
|
|
IEnumerable<IMessage> conversation = new List<IMessage>()
|
|
{
|
|
new TextMessage(Role.User, "Hey dalle, please generate image from prompt: English short hair blue cat chase after a mouse")
|
|
};
|
|
var maxRound = 20;
|
|
await gpt4VAgent.InitiateChatAsync(
|
|
receiver: dalleAgent,
|
|
message: "Hey dalle, please generate image from prompt: English short hair blue cat chase after a mouse",
|
|
maxRound: maxRound);
|
|
|
|
File.Exists(imagePath).Should().BeTrue();
|
|
}
|
|
}
|