feat: add solar pro llm and document parser #16099

Open · wants to merge 9 commits into base: main
Changes from 3 commits
@@ -1,11 +1,23 @@
-from typing import Optional, Dict, Any, Sequence, Callable
+import os
+from pathlib import Path
+from typing import List, Optional, Dict, Any, Sequence, Callable, Union
+import warnings
 
 import httpx
+from llama_index.readers.upstage import UpstageDocumentParseReader
 from llama_index.llms.openai.utils import (
+    from_openai_token_logprobs,
     create_retry_decorator,
+    from_openai_message,
 )
+from llama_index.core.base.llms.types import ChatResponse
 from llama_index.core.base.llms.types import LLMMetadata, ChatMessage
 from llama_index.llms.openai import OpenAI
+from llama_index.llms.openai.base import to_openai_message_dicts
 
 from llama_index.llms.upstage.utils import (
+    SOLAR_TOKENIZERS,
+    is_doc_parsing_model,
     resolve_upstage_credentials,
     is_chat_model,
     upstage_modelname_to_contextsize,
@@ -14,17 +26,25 @@
 from llama_index.core.callbacks import CallbackManager
 from llama_index.core.constants import DEFAULT_TEMPERATURE
 from llama_index.core.types import BaseOutputParser, PydanticProgramMode
-from llama_index.core.bridge.pydantic import ConfigDict
 from tokenizers import Tokenizer
-from pydantic import Field, PrivateAttr
+from pydantic import ConfigDict, Field, PrivateAttr
 from openai import OpenAI as SyncOpenAI
 from openai import AsyncOpenAI
 
 DEFAULT_UPSTAGE_MODEL = "solar-1-mini-chat"
 
+llm_retry_decorator = create_retry_decorator(
+    max_retries=6,
+    random_exponential=True,
+    stop_after_delay_seconds=60,
+    min_seconds=1,
+    max_seconds=20,
+)
+
 
 class Upstage(OpenAI):
-    """Upstage LLM.
+    """
+    Upstage LLM.
     Examples:
         `pip install llama-index-llms-upstage`
@@ -87,7 +107,7 @@ class Upstage(OpenAI):
             "Huggingface pretrained tokenizer name "
             "upstage opened solar tokenizer in Huggingface. https://huggingface.co/upstage/solar-1-mini-tokenizer"
         ),
-        default="upstage/solar-1-mini-tokenizer",
+        default=SOLAR_TOKENIZERS[DEFAULT_UPSTAGE_MODEL],
     )
 
     api_key: str = Field(
@@ -124,7 +144,7 @@ def __init__(
         completion_to_prompt: Optional[Callable[[str], str]] = None,
         pydantic_program_mode: PydanticProgramMode = PydanticProgramMode.DEFAULT,
         output_parser: Optional[BaseOutputParser] = None,
-        **kwargs: Any
+        **kwargs: Any,
     ) -> None:
         if "upstage_api_key" in kwargs:
             api_key = kwargs.pop("upstage_api_key")
@@ -153,7 +173,7 @@ def __init__(
             completion_to_prompt=completion_to_prompt,
             pydantic_program_mode=pydantic_program_mode,
             output_parser=output_parser,
-            **kwargs
+            **kwargs,
         )
 
         self.tokenizer_name = tokenizer_name
@@ -187,6 +207,10 @@ def _tokenizer(self) -> Optional[Tokenizer]:
         """
         Get a Huggingface tokenizer for solar models.
         """
+        if SOLAR_TOKENIZERS.get(self.model) != self.tokenizer_name:
+            warnings.warn(
+                f"You are using a different tokenizer than the one specified in the model. This may cause issues with token counting. Please use {SOLAR_TOKENIZERS[self.model]} as the tokenizer name."
+            )
         return Tokenizer.from_pretrained(self.tokenizer_name)
 
     def get_num_tokens_from_message(self, messages: Sequence[ChatMessage]) -> int:
@@ -207,3 +231,50 @@ def get_num_tokens_from_message(self, messages: Sequence[ChatMessage]) -> int:
         )
         num_tokens += tokens_suffix
         return num_tokens
+
+    @llm_retry_decorator
+    def _chat(self, messages: Sequence[ChatMessage], **kwargs: Any) -> ChatResponse:
+        if is_doc_parsing_model(self.model, kwargs):
Review thread on this line:
Collaborator: curious why we subclass _chat, but not any other method like _stream_chat or _achat, etc.
logan-markewich (Collaborator, Sep 19, 2024): I guess you only support parse documents with .chat() ?
JuHyung-Son (Contributor, Author, Oct 8, 2024): There was a mistake in following llamaindex interface. Added some more methods.
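As an illustrative aside (not code from this PR): an async counterpart mirroring the `_chat` override below could look roughly like the sketch here. It assumes the `_get_aclient()` helper inherited from the OpenAI base class and reuses this module's existing imports; details are unverified.

    # Sketch only. Assumes self._get_aclient() from the inherited OpenAI base
    # class; reuses the helpers already imported in this module.
    @llm_retry_decorator
    async def _achat(
        self, messages: Sequence[ChatMessage], **kwargs: Any
    ) -> ChatResponse:
        if is_doc_parsing_model(self.model, kwargs):
            document_contents = self._parse_documents(kwargs.pop("file_path"))
            # Build a new list rather than mutating the incoming Sequence.
            messages = [
                *messages,
                ChatMessage(role="user", content=document_contents),
            ]
        aclient = self._get_aclient()
        response = await aclient.chat.completions.create(
            messages=to_openai_message_dicts(messages),
            stream=False,
            **self._get_model_kwargs(**kwargs),
        )
        return ChatResponse(
            message=from_openai_message(response.choices[0].message),
            raw=response,
            additional_kwargs=self._get_response_token_counts(response),
        )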

+            document_contents = self._parse_documents(kwargs.pop("file_path"))
+            messages.append(ChatMessage(role="user", content=document_contents))
+        client = self._get_client()
+        message_dicts = to_openai_message_dicts(messages)
+        response = client.chat.completions.create(
+            messages=message_dicts,
+            stream=False,
+            **self._get_model_kwargs(**kwargs),
+        )
+        openai_message = response.choices[0].message
+        message = from_openai_message(openai_message)
+        openai_token_logprobs = response.choices[0].logprobs
+        logprobs = None
+        if openai_token_logprobs and openai_token_logprobs.content:
+            logprobs = from_openai_token_logprobs(openai_token_logprobs.content)
+
+        return ChatResponse(
+            message=message,
+            raw=response,
+            logprobs=logprobs,
+            additional_kwargs=self._get_response_token_counts(response),
+        )
+
+    def _parse_documents(
+        self, file_path: Union[str, Path, List[str], List[Path]]
+    ) -> str:
+        document_contents = "Documents:\n"
+
+        loader = UpstageDocumentParseReader(
+            api_key=self.api_key, output_format="text", coordinates=False
+        )
+        docs = loader.load_data(file_path)
+
+        if isinstance(file_path, list):
+            file_titles = [os.path.basename(path) for path in file_path]
+        else:
+            file_titles = [os.path.basename(file_path)]
+
+        for i, doc in enumerate(docs):
+            file_title = file_titles[min(i, len(file_titles) - 1)]
+            document_contents += f"{file_title}:\n{doc.text}\n\n"
+        print("DOCUMENT CONTENTS", document_contents)
+        return document_contents
Review thread on the print statement above:
Collaborator: lets remove this print
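For context, document parsing rides entirely on `.chat()`: `_chat` pops the `file_path` keyword, parses the files with `UpstageDocumentParseReader`, and appends the text as an extra user message. A minimal usage sketch (the file name and API key are placeholders, and passing `file_path` through `chat()` assumes kwargs are forwarded to `_chat`):

    from llama_index.core.base.llms.types import ChatMessage
    from llama_index.llms.upstage import Upstage

    # "solar-pro" is the only entry in DOC_PARSING_MODELS at this commit.
    llm = Upstage(model="solar-pro", api_key="YOUR_UPSTAGE_API_KEY")

    response = llm.chat(
        [ChatMessage(role="user", content="Summarize the attached report.")],
        file_path="report.pdf",  # a str/Path, or a list of them
    )
    print(response.message.content)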

(Second changed file)
@@ -1,16 +1,27 @@
 import logging
-from typing import Optional, Tuple
+from typing import Any, Dict, Optional, Tuple
 
 from llama_index.core.base.llms.generic_utils import get_from_param_or_env
 
 DEFAULT_UPSTAGE_API_BASE = "https://api.upstage.ai/v1/solar"
 DEFAULT_CONTEXT_WINDOW = 32768
 CHAT_MODELS = {
     "solar-1-mini-chat": 32768,
+    "solar-pro": 4096,
+    "solar-docvision": 65536,
 }
 
+FUNCTION_CALLING_MODELS = ["solar-1-mini-chat"]
+DOC_PARSING_MODELS = ["solar-pro"]
+
 ALL_AVAILABLE_MODELS = {**CHAT_MODELS}
 
+SOLAR_TOKENIZERS = {
+    "solar-pro": "upstage/solar-pro-preview-tokenizer",
+    "solar-1-mini-chat": "upstage/solar-1-mini-tokenizer",
+    "solar-docvision": "upstage/solar-docvision-preview-tokenizer",
+}
+
 logger = logging.getLogger(__name__)
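The `SOLAR_TOKENIZERS` mapping above is what drives the new tokenizer-mismatch warning in `Upstage._tokenizer`. A behavior sketch (it assumes token counting resolves the tokenizer through `_tokenizer`; the API key is a placeholder):

    from llama_index.core.base.llms.types import ChatMessage
    from llama_index.llms.upstage import Upstage
    from llama_index.llms.upstage.utils import SOLAR_TOKENIZERS

    llm = Upstage(model="solar-pro", api_key="YOUR_UPSTAGE_API_KEY")
    # tokenizer_name still defaults to the solar-1-mini tokenizer:
    assert llm.tokenizer_name == SOLAR_TOKENIZERS["solar-1-mini-chat"]
    # Counting tokens resolves the tokenizer, so the mismatch check fires and
    # warns, suggesting "upstage/solar-pro-preview-tokenizer" instead.
    llm.get_num_tokens_from_message([ChatMessage(role="user", content="hello")])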


@@ -40,7 +51,15 @@ def is_chat_model(model: str) -> bool:
 
 
 def is_function_calling_model(model: str) -> bool:
-    return is_chat_model(model)
+    return model in FUNCTION_CALLING_MODELS
+
+
+def is_doc_parsing_model(model: str, kwargs: Dict[str, Any]) -> bool:
+    if "file_path" in kwargs:
+        if model in DOC_PARSING_MODELS:
+            return True
+        raise ValueError("file_path is not supported for this model.")
+    return False


 def upstage_modelname_to_contextsize(modelname: str) -> int:
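For reference, a quick sketch of how the new `is_doc_parsing_model` dispatches, given the constants above:

    from llama_index.llms.upstage.utils import is_doc_parsing_model

    is_doc_parsing_model("solar-pro", {"file_path": "report.pdf"})  # True
    is_doc_parsing_model("solar-pro", {})  # False: no file_path in kwargs
    is_doc_parsing_model("solar-1-mini-chat", {"file_path": "report.pdf"})
    # raises ValueError("file_path is not supported for this model.")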