Skip to content

Commit

Permalink
use archfc hosted on aws (#409)
Browse files Browse the repository at this point in the history
  • Loading branch information
adilhafeez authored Feb 13, 2025
1 parent 28ee14a commit 4ec03af
Show file tree
Hide file tree
Showing 5 changed files with 10 additions and 9 deletions.
2 changes: 1 addition & 1 deletion model_server/src/commons/globals.py
Original file line number Diff line number Diff line change
Expand Up @@ -15,7 +15,7 @@


# Define the client
ARCH_ENDPOINT = os.getenv("ARCH_ENDPOINT", "https://api.fc.archgw.com/v1")
ARCH_ENDPOINT = os.getenv("ARCH_ENDPOINT", "https://archfc.katanemo.dev/v1")
ARCH_API_KEY = "EMPTY"
ARCH_CLIENT = OpenAI(base_url=ARCH_ENDPOINT, api_key=ARCH_API_KEY)

Expand Down
4 changes: 3 additions & 1 deletion model_server/src/main.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,7 +4,7 @@
import logging
import src.commons.utils as utils

from src.commons.globals import handler_map
from src.commons.globals import ARCH_ENDPOINT, handler_map
from src.core.utils.model_utils import (
ChatMessage,
ChatCompletionResponse,
Expand Down Expand Up @@ -51,6 +51,8 @@
app = FastAPI()
FastAPIInstrumentor().instrument_app(app)

logger.info(f"using archfc endpoint: {ARCH_ENDPOINT}")


@app.get("/healthz")
async def healthz():
Expand Down
5 changes: 2 additions & 3 deletions tests/rest/api_model_server.rest
Original file line number Diff line number Diff line change
@@ -1,6 +1,5 @@
@model_server_endpoint = http://localhost:51000
@archfc_endpoint = https://api.fc.archgw.com

@archfc_endpoint = https://archfc.katanemo.dev

### talk to function calling endpoint
POST {{model_server_endpoint}}/function_calling HTTP/1.1
Expand Down Expand Up @@ -119,7 +118,7 @@ Content-Type: application/json
}

### talk to Arch-Intent directly for completion
POST {{archfc_endpoint}}/v1/chat/completions HTTP/1.1
POST {{archfc_endpoint}}/v1/chat/completions HTTP/1.1
Content-Type: application/json

{
Expand Down
6 changes: 3 additions & 3 deletions tests/rest/insurance_agent.rest
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
@model_server_endpoint = http://localhost:51000
@archfc_endpoint = https://api.fc.archgw.com
@archfc_endpoint = https://archfc.katanemo.dev

### multi turn conversation with intent, except parameter gathering

Expand Down Expand Up @@ -55,7 +55,7 @@ Content-Type: application/json
]
}
### talk to Arch-Intent directly for completion
POST https://api.fc.archgw.com/v1/chat/completions HTTP/1.1
POST https://archfc.katanemo.dev/v1/chat/completions HTTP/1.1
Content-Type: application/json

{
Expand Down Expand Up @@ -126,7 +126,7 @@ Content-Type: application/json
]
}
### talk to Arch-Intent directly for completion, expect No
POST https://api.fc.archgw.com/v1/chat/completions HTTP/1.1
POST https://archfc.katanemo.dev/v1/chat/completions HTTP/1.1
Content-Type: application/json

{
Expand Down
2 changes: 1 addition & 1 deletion tests/rest/network_agent.rest
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
@model_server_endpoint = http://localhost:51000
@archfc_endpoint = https://api.fc.archgw.com
@archfc_endpoint = https://archfc.katanemo.dev

### single turn function calling all parameters insurance agent summary

Expand Down

0 comments on commit 4ec03af

Please sign in to comment.