Skip to content

Commit

Permalink
Add AIPC, NVGPU, and AMD ROCm support
Browse files Browse the repository at this point in the history
  • Loading branch information
louie-tsai committed Dec 10, 2024
1 parent efa43a2 commit da12881
Show file tree
Hide file tree
Showing 4 changed files with 566 additions and 297 deletions.
71 changes: 71 additions & 0 deletions ChatQnA/tests/ChatQnA_AIPC.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,71 @@
{
"ChatQnA_AIPC": [
{
"service": "env",
"port": "",
"endpoint": "",
"EMBEDDING_MODEL_ID": true,
"RERANK_MODEL_ID": true,
"OLLAMA_MODEL": true,
"OLLAMA_HOST": true,
"INDEX_NAME": true,
"HUGGINGFACEHUB_API_TOKEN": true,
"http_proxy": false,
"https_proxy": false,
"no_proxy": false,
"output": false
},
{
"service": "embed",
"port": "6006",
"endpoint": "embed",
"inputs": "What is Deep Learning?",
"output": "[["
},
{
"service": "dataprep",
"port": "6007",
"endpoint": "/v1/dataprep",
"file_path": "",
"output": "Data preparation succeeded"
},
{
"service": "retrieval",
"port": "7000",
"endpoint": "/v1/retrieval",
"text": "test",
"embedding": "",
"output": "retrieved_docs"
},
{
"service": "rerank",
"port": "8808",
"endpoint": "rerank",
"query": "What is Deep Learning?",
"texts": ["Deep Learning is not...", "Deep learning is..."],
"output": "index"
},
{
"service": "llm",
"port": "11434",
"endpoint": "api/generate",
"model": "llama3.2",
"prompt": "What is Deep Learning?",
"output": "response"
},
{
"service": "nginx",
"port": "80",
"endpoint": "v1/chatqna",
"messages": "What is the revenue of Nike in 2023?",
"output": "data: "
},
{
"service": "mega",
"port": "8888",
"endpoint": "v1/chatqna",
"messages": "What is the revenue of Nike in 2023?",
"output": "data: "
}
]
}
82 changes: 82 additions & 0 deletions ChatQnA/tests/ChatQnA_NVGPU.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,82 @@
{
"ChatQnA_NVGPU": [
{
"service": "env",
"port": "",
"endpoint": "",
"EMBEDDING_MODEL_ID": true,
"RERANK_MODEL_ID": true,
"LLM_MODEL_ID": true,
"INDEX_NAME": true,
"HUGGINGFACEHUB_API_TOKEN": true,
"TEI_EMBEDDING_ENDPOINT": true,
"MEGA_SERVICE_HOST_IP": true,
"RETRIEVER_SERVICE_HOST_IP": true,
"BACKEND_SERVICE_ENDPOINT": true,
"DATAPREP_SERVICE_ENDPOINT": true,
"DATAPREP_GET_FILE_ENDPOINT": true,
"DATAPREP_DELETE_FILE_ENDPOINT": true,
"FRONTEND_SERVICE_IP": true,
"FRONTEND_SERVICE_PORT": true,
"BACKEND_SERVICE_NAME": true,
"BACKEND_SERVICE_IP": true,
"BACKEND_SERVICE_PORT": true,
"http_proxy": false,
"https_proxy": false,
"no_proxy": false,
"output": false
},
{
"service": "embed",
"port": "8090",
"endpoint": "embed",
"inputs": "What is Deep Learning?",
"output": "[["
},
{
"service": "dataprep",
"port": "6007",
"endpoint": "/v1/dataprep",
"file_path": "",
"output": "Data preparation succeeded"
},
{
"service": "retrieval",
"port": "7000",
"endpoint": "/v1/retrieval",
"text": "test",
"embedding": "",
"output": "retrieved_docs"
},
{
"service": "rerank",
"port": "8808",
"endpoint": "rerank",
"query": "What is Deep Learning?",
"texts": ["Deep Learning is not...", "Deep learning is..."],
"output": "index"
},
{
"service": "llm",
"port": "8008",
"endpoint": "v1/chat/completions",
"model": "Intel/neural-chat-7b-v3-3",
"messages": [{ "role": "user", "content": "What is Deep Learning?" }],
"output": "content"
},
{
"service": "nginx",
"port": "80",
"endpoint": "v1/chatqna",
"messages": "What is the revenue of Nike in 2023?",
"output": "data: "
},
{
"service": "mega",
"port": "8888",
"endpoint": "v1/chatqna",
"messages": "What is the revenue of Nike in 2023?",
"output": "data: "
}
]
}
95 changes: 95 additions & 0 deletions ChatQnA/tests/ChatQnA_ROCm.json
Original file line number Diff line number Diff line change
@@ -0,0 +1,95 @@
{
"ChatQnA_ROCm": [
{
"service": "env",
"port": "",
"endpoint": "",
"CHATQNA_HUGGINGFACEHUB_API_TOKEN": true,
"CHATQNA_TGI_SERVICE_IMAGE": true,
"CHATQNA_EMBEDDING_MODEL_ID": true,
"CHATQNA_RERANK_MODEL_ID": true,
"CHATQNA_LLM_MODEL_ID": true,
"CHATQNA_TGI_SERVICE_PORT": true,
"CHATQNA_TEI_EMBEDDING_PORT": true,
"CHATQNA_TEI_EMBEDDING_ENDPOINT": true,
"CHATQNA_TEI_RERANKING_PORT": true,
"CHATQNA_REDIS_VECTOR_PORT": true,
"CHATQNA_REDIS_VECTOR_INSIGHT_PORT": true,
"CHATQNA_REDIS_DATAPREP_PORT": true,
"CHATQNA_REDIS_RETRIEVER_PORT": true,
"CHATQNA_INDEX_NAME": true,
"CHATQNA_MEGA_SERVICE_HOST_IP": true,
"CHATQNA_RETRIEVER_SERVICE_HOST_IP": true,
"CHATQNA_BACKEND_SERVICE_ENDPOINT": true,
"CHATQNA_DATAPREP_SERVICE_ENDPOINT": true,
"CHATQNA_DATAPREP_GET_FILE_ENDPOINT": true,
"CHATQNA_DATAPREP_DELETE_FILE_ENDPOINT": true,
"CHATQNA_FRONTEND_SERVICE_IP": true,
"CHATQNA_FRONTEND_SERVICE_PORT": true,
"CHATQNA_BACKEND_SERVICE_NAME": true,
"CHATQNA_BACKEND_SERVICE_IP": true,
"CHATQNA_BACKEND_SERVICE_PORT": true,
"CHATQNA_REDIS_URL": true,
"CHATQNA_EMBEDDING_SERVICE_HOST_IP": true,
"CHATQNA_RERANK_SERVICE_HOST_IP": true,
"CHATQNA_LLM_SERVICE_HOST_IP": true,
"CHATQNA_NGINX_PORT": true,
"http_proxy": false,
"https_proxy": false,
"no_proxy": false,
"output": false
},
{
"service": "embed",
"port": "8090",
"endpoint": "embed",
"inputs": "What is Deep Learning?",
"output": "[["
},
{
"service": "dataprep",
"port": "6007",
"endpoint": "/v1/dataprep",
"file_path": "",
"output": "Data preparation succeeded"
},
{
"service": "retrieval",
"port": "7000",
"endpoint": "/v1/retrieval",
"text": "test",
"embedding": "",
"output": "retrieved_docs"
},
{
"service": "rerank",
"port": "8808",
"endpoint": "rerank",
"query": "What is Deep Learning?",
"texts": ["Deep Learning is not...", "Deep learning is..."],
"output": "index"
},
{
"service": "llm",
"port": "8008",
"endpoint": "generate",
"inputs": "What is Deep Learning?",
"parameters": { "max_new_tokens": 64, "do_sample": true },
"output": "generated_text"
},
{
"service": "nginx",
"port": "80",
"endpoint": "v1/chatqna",
"messages": "What is the revenue of Nike in 2023?",
"output": "data: "
},
{
"service": "mega",
"port": "8888",
"endpoint": "v1/chatqna",
"messages": "What is the revenue of Nike in 2023?",
"output": "data: "
}
]
}
Loading

0 comments on commit da12881

Please sign in to comment.