Method model_dump

optillm/inference.py:1712–1741 · view source on GitHub ↗

(self)

Source from the content-addressed store, hash-verified

1710	self.usage = ChatCompletionUsage(**response_dict["usage"])
1711
def model_dump(self) -> Dict:
    """Serialize this response object into a plain nested dictionary.

    The result carries the top-level ``id``, ``object``, ``created`` and
    ``model`` attributes, one entry per item in ``self.choices``, and a
    ``usage`` section built from ``self.usage``.

    Returns:
        A dict with keys ``id``, ``object``, ``created``, ``model``,
        ``choices`` and ``usage``.
    """
    dumped = {
        "id": self.id,
        "object": self.object,
        "created": self.created,
        "model": self.model,
    }

    serialized_choices = []
    for entry in self.choices:
        item = {"index": entry.index}
        msg = entry.message
        # "logprobs" is only emitted when the message carries a truthy value.
        include_logprobs = bool(msg.logprobs)
        payload = {"role": msg.role, "content": msg.content}
        if include_logprobs:
            payload["logprobs"] = msg.logprobs
        item["message"] = payload
        item["finish_reason"] = entry.finish_reason
        serialized_choices.append(item)
    dumped["choices"] = serialized_choices

    usage = self.usage
    usage_section = {
        "prompt_tokens": usage.prompt_tokens,
        "completion_tokens": usage.completion_tokens,
        "total_tokens": usage.total_tokens,
    }
    # Falls back to 0 when the usage object has no reasoning_tokens attribute.
    usage_section["completion_tokens_details"] = {
        "reasoning_tokens": getattr(usage, 'reasoning_tokens', 0)
    }
    dumped["usage"] = usage_section

    return dumped
1742
1743	class InferenceClient:
1744	"""OpenAI SDK Compatible client for local inference with dynamic model support"""

test_chat_completion_model_dump_structure (Method) · 0.95

test_chat_completion_model_dump_includes_reasoning_tokens (Method) · 0.95

test_chat_completion_response_structure (Method) · 0.95

get_llm_response (Function) · 0.45

mixture_of_agents (Function) · 0.45

cot_reflection (Function) · 0.45

generate_response (Method) · 0.45

re2_approach (Function) · 0.45

extract_examples_from_query (Method) · 0.45

generate_mistakes (Method) · 0.45

generate_low_level_principles (Method) · 0.45

generate_high_level_principles (Method) · 0.45

no outgoing calls

test_chat_completion_model_dump_structure (Method) · 0.76

test_chat_completion_model_dump_includes_reasoning_tokens (Method) · 0.76

test_chat_completion_response_structure (Method) · 0.76