From c12390a0dafb1699a9121c624d944f47dac2543d Mon Sep 17 00:00:00 2001 From: Sophie Chen <39424052+SophieGarden@users.noreply.github.com> Date: Thu, 9 May 2024 18:14:23 -0700 Subject: [PATCH] remove duplicates.. (#850) Co-authored-by: Sophie Chen --- scripts/data_utils.py | 25 ------------------------- 1 file changed, 25 deletions(-) diff --git a/scripts/data_utils.py b/scripts/data_utils.py index 41802f6301..042df69e9c 100644 --- a/scripts/data_utils.py +++ b/scripts/data_utils.py @@ -689,31 +689,6 @@ def get_embedding(text, embedding_model_endpoint=None, embedding_model_key=None, except Exception as e: raise Exception(f"Error getting embeddings with endpoint={endpoint} with error={e}") -def get_embedding(text, embedding_model_endpoint=None, embedding_model_key=None, azure_credential=None): - endpoint = embedding_model_endpoint if embedding_model_endpoint else os.environ.get("EMBEDDING_MODEL_ENDPOINT") - key = embedding_model_key if embedding_model_key else os.environ.get("EMBEDDING_MODEL_KEY") - - if azure_credential is None and (endpoint is None or key is None): - raise Exception("EMBEDDING_MODEL_ENDPOINT and EMBEDDING_MODEL_KEY are required for embedding") - - try: - endpoint_parts = endpoint.split("/openai/deployments/") - base_url = endpoint_parts[0] - deployment_id = endpoint_parts[1].split("/embeddings")[0] - - api_version = endpoint_parts[1].split("api-version=")[1].split("&")[0] - - if azure_credential is not None: - api_key = azure_credential.get_token("https://cognitiveservices.azure.com/.default").token - else: - api_key = key - - client = AzureOpenAI(api_version=api_version, azure_endpoint=base_url, azure_ad_token=api_key) - embeddings = client.embeddings.create(model=deployment_id, input=text) - return embeddings.dict()['data'][0]['embedding'] - - except Exception as e: - raise Exception(f"Error getting embeddings with endpoint={endpoint} with error={e}") def chunk_content_helper(