Skip to content

Instantly share code, notes, and snippets.

@AGInfer
Last active February 21, 2024 20:22
Show Gist options
  • Save AGInfer/1ffe88623c0b903fb594425a966c46ae to your computer and use it in GitHub Desktop.
from vllm import LLM, SamplingParams
class InferlessPythonModel:
    """Inferless serving wrapper around a vLLM-hosted Mistral-7B AWQ model.

    Lifecycle: ``initialize`` loads the model once, ``infer`` handles each
    request, ``finalize`` runs at shutdown.
    """

    def initialize(self):
        """Load the quantized model and fix the decoding configuration."""
        # Decoding settings: moderately creative sampling, at most 256 new tokens.
        self.sampling_params = SamplingParams(
            temperature=0.7,
            top_p=0.95,
            max_tokens=256,
        )
        # 4-bit AWQ-quantized Mistral-7B checkpoint; 2048-token context window,
        # allowing vLLM to use up to 90% of GPU memory for weights + KV cache.
        self.llm = LLM(
            model="TheBloke/Mistral-7B-v0.1-AWQ",
            quantization="awq",
            dtype="float16",
            max_model_len=2048,
            gpu_memory_utilization=0.9,
        )

    def infer(self, inputs):
        """Generate a completion for ``inputs["prompt"]``.

        Returns a dict with the first generation's text under the key
        ``gresult`` (the platform's expected response shape).
        """
        prompt = inputs["prompt"]
        generations = self.llm.generate(prompt, self.sampling_params)
        # One RequestOutput per prompt; take the first candidate of each.
        texts = [gen.outputs[0].text for gen in generations]
        return {'gresult': texts[0]}

    def finalize(self):
        """Shutdown hook — nothing to release explicitly."""
        pass
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment