Morgan Funtowicz
committed on
Commit
·
4976a8c
1
Parent(s):
12f7a48
do not put a space between prompt and content
Browse files - handler.py +2 -3
handler.py
CHANGED
|
@@ -86,15 +86,14 @@ class VllmEmbeddingHandler(Handler):
|
|
| 86 |
embeddings = []
|
| 87 |
num_tokens = 0
|
| 88 |
for idx, document in enumerate(request.inputs):
|
| 89 |
-
input = f"{prompt} {document}" if prompt else document
|
| 90 |
-
print(input)
|
| 91 |
|
| 92 |
output = await self.embeds(input, pooling_params, f"{ctx.request_id}-{idx}")
|
| 93 |
num_tokens += len(output[0].prompt_token_ids)
|
| 94 |
embeddings += [output[0].outputs.embedding]
|
| 95 |
else:
|
| 96 |
input = f"{prompt} {request.inputs}" if prompt else request.inputs
|
| 97 |
-
|
| 98 |
output = await self.embeds(input, pooling_params, ctx.request_id)
|
| 99 |
num_tokens = len(output[0].prompt_token_ids)
|
| 100 |
embeddings = output[0].outputs.embedding
|
|
|
|
| 86 |
embeddings = []
|
| 87 |
num_tokens = 0
|
| 88 |
for idx, document in enumerate(request.inputs):
|
| 89 |
+
input = f"{prompt}{document}" if prompt else document
|
|
|
|
| 90 |
|
| 91 |
output = await self.embeds(input, pooling_params, f"{ctx.request_id}-{idx}")
|
| 92 |
num_tokens += len(output[0].prompt_token_ids)
|
| 93 |
embeddings += [output[0].outputs.embedding]
|
| 94 |
else:
|
| 95 |
input = f"{prompt} {request.inputs}" if prompt else request.inputs
|
| 96 |
+
|
| 97 |
output = await self.embeds(input, pooling_params, ctx.request_id)
|
| 98 |
num_tokens = len(output[0].prompt_token_ids)
|
| 99 |
embeddings = output[0].outputs.embedding
|