implement local vllm model usage
Run Tests / Run Tests (push) Successful in 46s Details

This commit is contained in:
James Ravenscroft 2024-12-11 16:12:52 +00:00
parent 9222739df1
commit f7db98d91e
5 changed files with 18 additions and 11 deletions

View File

@ -8,7 +8,7 @@ services:
vllm: vllm:
image: vllm/vllm-openai:latest image: vllm/vllm-openai:latest
command: "--model Qwen/Qwen2-VL-2B-Instruct" command: "--model Qwen/Qwen2-VL-2B-Instruct-GPTQ-Int4 --quantization gptq"
volumes: volumes:
- ~/.cache/huggingface:/root/.cache/huggingface - ~/.cache/huggingface:/root/.cache/huggingface
ports: ports:
@ -21,4 +21,4 @@ services:
devices: devices:
- driver: nvidia - driver: nvidia
device_ids: ["0"] device_ids: ["0"]
capabilities: [gpu] capabilities: [gpu]

View File

@ -149,5 +149,6 @@ CELERY_BROKER_URL = "amqp://guest:guest@localhost/"
OPENAI_API_BASE = os.getenv("OPENAI_API_BASE") OPENAI_API_BASE = os.getenv("OPENAI_API_BASE")
OPENAI_API_KEY = os.getenv("OPENAI_API_KEY") #OPENAI_API_KEY = os.getenv("OPENAI_API_KEY")
OPENAI_API_KEY = "test"
OPENAI_MODEL = os.getenv("OPENAI_MODEL", "openai/gpt-4o") OPENAI_MODEL = os.getenv("OPENAI_MODEL", "openai/gpt-4o")

View File

@ -1,26 +1,26 @@
import requests
import base64 import base64
import litellm import litellm
import os
from loguru import logger from loguru import logger
from celery import shared_task, Task from celery import shared_task
from django.db import transaction from django.db import transaction
from django.core.files.storage import default_storage from django.core.files.storage import default_storage
from django.conf import settings from django.conf import settings
from .models import ImageMemo, MemoStatus from .models import ImageMemo, MemoStatus
from datetime import datetime
TRANSCRIBE_PROMPT = """Transcribe the hand written notes in the attached image and present them as markdown. TRANSCRIBE_PROMPT = """Transcribe the hand written notes in the attached image and present them as markdown.
Do not use a fence, simply respond using markdown. Do not use a fence, simply respond using markdown.
If any words or letters are unclear, denote them with a '?<word>?'. If any words or letters are unclear, denote them with a '?<word>?'.
For example if you were not sure whether a word is blow or blew you would transcribe it as '?blow?' For example if you were not sure whether a word is blow or blew you would transcribe it as '?blow?'
Please include whitespace and formatting for headings too.
""" """
@shared_task @shared_task
def process_memo(memo_id: str): def process_memo(memo_id: str):
"""Run OCR on a memo and store the output""" """Run OCR on a memo and store the output"""
@ -67,6 +67,7 @@ def process_memo(memo_id: str):
response = litellm.completion( response = litellm.completion(
model=settings.OPENAI_MODEL, #os.getenv("MODEL", "openai/gpt-4o"), model=settings.OPENAI_MODEL, #os.getenv("MODEL", "openai/gpt-4o"),
messages=[message], messages=[message],
temperature=0.01
) )
response.choices[0].message["content"] response.choices[0].message["content"]

View File

@ -36,11 +36,11 @@
</tr> </tr>
<tr> <tr>
<td class="font-medium pr-4">Created:</td> <td class="font-medium pr-4">Created:</td>
<td class="text-gray-600">{{ document.created_at|date:"d/m/Y H:i" }}</td> <td class="text-gray-600">{{ document.created_at|date:"d/m/Y H:i:s" }}</td>
</tr> </tr>
<tr> <tr>
<td class="font-medium pr-4">Updated:</td> <td class="font-medium pr-4">Updated:</td>
<td class="text-gray-600">{{ document.updated_at|date:"d/m/Y H:i" }}</td> <td class="text-gray-600">{{ document.updated_at|date:"d/m/Y H:i:s" }}</td>
</tr> </tr>
</table> </table>
{% if document.content %} {% if document.content %}

View File

@ -1,5 +1,10 @@
version = 1 version = 1
requires-python = ">=3.9" requires-python = ">=3.9"
resolution-markers = [
"python_full_version < '3.11'",
"python_full_version == '3.11.*'",
"python_full_version >= '3.12'",
]
[[package]] [[package]]
name = "aiohappyeyeballs" name = "aiohappyeyeballs"