import os

from llama_index.llms.cometapi import CometLLM

# "<COMETAPI_KEY>" is a placeholder, not a usable credential: substitute your
# own key here, or drop this assignment and export COMETAPI_KEY in your shell
# so the secret never lives in the script.
os.environ["COMETAPI_KEY"] = "<COMETAPI_KEY>"

# Read the key back from the environment; os.getenv returns None when unset.
api_key = os.getenv("COMETAPI_KEY")
使用環境變數比在腳本中硬編碼憑證更安全。
3
初始化模型並進行補全呼叫
from llama_index.core.llms import ChatMessage

# `CometLLM` and `api_key` are expected to be defined by the setup step above.
llm = CometLLM(
    api_key=api_key,
    max_tokens=256,
    context_window=4096,
    model="your-model-id",  # placeholder: replace with a real model id
)

# Chat call
messages = [
    ChatMessage(role="system", content="You are a helpful assistant"),
    ChatMessage(role="user", content="Say 'Hi' only!"),
]
resp = llm.chat(messages)
print(resp)

# Completion call
resp = llm.complete("Who is Kaiming He?")
print(resp)
4
啟用串流
使用 `stream_chat` 或 `stream_complete` 以取得即時分塊輸出:
# Streaming chat
# `llm` and `ChatMessage` are expected to come from the initialization step.
message = ChatMessage(role="user", content="Tell me what ResNet is")
for chunk in llm.stream_chat([message]):
    # Print each chunk's delta without a newline so the pieces join up.
    print(chunk.delta, end="")

# Streaming completion
for chunk in llm.stream_complete("Tell me about Large Language Models"):
    print(chunk.delta, end="")