sync from upstream

2024-06-25 11:19:26 +00:00 · 2024-06-25 11:19:26 +00:00 · 101d1738b6
commit 101d1738b6
parent e9c6756c2e
3 changed files with 8 additions and 107 deletions
--- a/backend/llm.py
+++ b/backend/llm.py
@ -62,7 +62,7 @@ async def stream_openai_response(
    model: Llm,
 ) -> str:
    client = AsyncOpenAI(api_key=api_key, base_url=base_url)
-
+    print(f"--stream_openai_response--{model}")
    # Base parameters
    params = {
        "model": model.value,
@ -105,9 +105,9 @@ async def stream_claude_response(
    callback: Callable[[str], Awaitable[None]],
    model: Llm,
 ) -> str:
-
+    print(f"--stream_openai_response--{model}")
    # client = AsyncAnthropic(api_key=api_key)
-
+    modelId = BEDROCK_LLM_MODELID_LIST[model]
    # Base parameters
    max_tokens = 4096
    temperature = 0.0
@ -256,17 +256,6 @@ async def stream_claude_response_native(
                            response_text += chunk_obj['delta']['text']
                            await callback(chunk_obj['delta']['text'])
                    # if chunk_obj['type'] == 'content_block_delta':
                    #     print(f"\nStop reason: {chunk_obj['delta']['stop_reason']}")
                    #     print(f"Stop sequence: {chunk_obj['delta']['stop_sequence']}")
                    #     print(f"Output tokens: {chunk_obj['usage']['output_tokens']}")
                    #     output_tokens  = chunk_obj['usage']['output_tokens']
                    #     # input_tokens  = chunk_obj['usage']['input_tokens']
                    #     # input_tokens = chunk_obj['amazon-bedrock-invocationMetrics']['inputTokenCount']
                    # if chunk_obj['type'] == 'text_delta':
                    #     print(chunk_obj['delta']['text'])
                    #     response_text += chunk_obj['delta']['text']
                    #     await callback(chunk_obj['delta']['text'])
        print(response_text)
        # Write each pass's code to .html file and thinking to .txt file
@ -304,91 +293,3 @@ async def stream_claude_response_native(
        raise Exception("No HTML response found in AI response")
    else:
        return response_text
 async def stream_claude_response_native_bak(
    system_prompt: str,
    messages: list[Any],
    api_key: str,
    callback: Callable[[str], Awaitable[None]],
    include_thinking: bool = False,
    model: Llm = Llm.CLAUDE_3_OPUS,
 ) -> str:
    client = AsyncAnthropic(api_key=api_key)
    # Base model parameters
    max_tokens = 4096
    temperature = 0.0
    # Multi-pass flow
    current_pass_num = 1
    max_passes = 2
    prefix = "<thinking>"
    response = None
    # For debugging
    full_stream = ""
    debug_file_writer = DebugFileWriter()
    while current_pass_num <= max_passes:
        current_pass_num += 1
        # Set up message depending on whether we have a <thinking> prefix
        messages_to_send = (
            messages + [{"role": "assistant", "content": prefix}]
            if include_thinking
            else messages
        )
        pprint_prompt(messages_to_send)
        async with client.messages.stream(
            model=model.value,
            max_tokens=max_tokens,
            temperature=temperature,
            system=system_prompt,
            messages=messages_to_send,  # type: ignore
        ) as stream:
            async for text in stream.text_stream:
                print(text, end="", flush=True)
                full_stream += text
                await callback(text)
        response = await stream.get_final_message()
        response_text = response.content[0].text
        # Write each pass's code to .html file and thinking to .txt file
        if IS_DEBUG_ENABLED:
            debug_file_writer.write_to_file(
                f"pass_{current_pass_num - 1}.html",
                debug_file_writer.extract_html_content(response_text),
            )
            debug_file_writer.write_to_file(
                f"thinking_pass_{current_pass_num - 1}.txt",
                response_text.split("</thinking>")[0],
            )
        # Set up messages array for next pass
        messages += [
            {"role": "assistant", "content": str(prefix) + response.content[0].text},
            {
                "role": "user",
                "content": "You've done a good job with a first draft. Improve this further based on the original instructions so that the app is fully functional and looks like the original video of the app we're trying to replicate.",
            },
        ]
        print(
            f"Token usage: Input Tokens: {response.usage.input_tokens}, Output Tokens: {response.usage.output_tokens}"
        )
    # Close the Anthropic client
    await client.close()
    if IS_DEBUG_ENABLED:
        debug_file_writer.write_to_file("full_stream.txt", full_stream)
    if not response:
        raise Exception("No HTML response found in AI response")
    else:
        return response.content[0].text
--- a/frontend/src/App.tsx
+++ b/frontend/src/App.tsx
@ -441,7 +441,7 @@ function App() {
                2x faster. Give it a try!
              </p>
            </div>
-          )} */}
+          )} 
          {appState !== AppState.CODE_READY && <TipLink />}
--- a/frontend/src/lib/models.ts
+++ b/frontend/src/lib/models.ts
@ -1,10 +1,10 @@
 // Keep in sync with backend (llm.py)
 // Order here matches dropdown order
 export enum CodeGenerationModel {
-  CLAUDE_3_5_SONNET = "claude_3_5_sonnet",
+  CLAUDE_3_5_SONNET_2024_06_20 = "claude-3-5-sonnet-20240620",
  // CLAUDE_3_5_SONNET = "claude_3_5_sonnet",
  CLAUDE_3_SONNET = "claude_3_sonnet",
  GPT_4O_2024_05_13 = "gpt-4o-2024-05-13",
  CLAUDE_3_5_SONNET_2024_06_20 = "claude-3-5-sonnet-20240620",
  GPT_4_TURBO_2024_04_09 = "gpt-4-turbo-2024-04-09",
  GPT_4_VISION = "gpt_4_vision",
 }
@ -13,10 +13,10 @@ export enum CodeGenerationModel {
 export const CODE_GENERATION_MODEL_DESCRIPTIONS: {
  [key in CodeGenerationModel]: { name: string; inBeta: boolean };
 } = {
  "gpt-4o-2024-05-13": { name: "GPT-4o 🌟", inBeta: false },
  "claude-3-5-sonnet-20240620": { name: "Claude 3.5 Sonnet 🌟", inBeta: false },
  "gpt-4o-2024-05-13": { name: "GPT-4o 🌟", inBeta: false },
  "gpt-4-turbo-2024-04-09": { name: "GPT-4 Turbo (Apr 2024)", inBeta: false },
  gpt_4_vision: { name: "GPT-4 Vision (Nov 2023)", inBeta: false },
  claude_3_sonnet: { name: "Claude 3 Sonnet", inBeta: false },
-  claude_3_5_sonnet: { name: "Claude 3.5 Sonnet", inBeta: false },
+  // claude_3_5_sonnet: { name: "Claude 3.5 Sonnet", inBeta: false },
 };