-
Notifications
You must be signed in to change notification settings - Fork 0
Expand file tree
/
Copy pathCustomLLM.py
More file actions
76 lines (61 loc) · 2.16 KB
/
CustomLLM.py
File metadata and controls
76 lines (61 loc) · 2.16 KB
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
from typing import Any, List, Mapping, Optional
from langchain_core.callbacks.manager import CallbackManagerForLLMRun
from langchain_core.language_models.llms import LLM
import requests
import json
from ARGO import ArgoWrapper, ArgoEmbeddingWrapper
from llama_cpp.llama_grammar import LlamaGrammar
# The ARGO_LLM class. Uses the _invoke_model helper function.
# It implements the _call function.
class ARGO_LLM(LLM):
argo: ArgoWrapper
grammar: Optional[LlamaGrammar] = None
@property
def _llm_type(self) -> str:
return "custom"
def _call(
self,
prompt: str,
stop: Optional[List[str]] = None,
run_manager: Optional[CallbackManagerForLLMRun] = None,
**kwargs: Any,
) -> str:
if stop is not None:
print(f"STOP={stop}")
# raise ValueError("stop kwargs are not permitted.")
response = self.argo.invoke(prompt)
#print(f"ARGO Response: {response['response']}\nEND ARGO RESPONSE")
return response['response']
@property
def _identifying_params(self) -> Mapping[str, Any]:
"""Get the identifying parameters."""
return {}
@property
def _generations(self):
return
class ARGO_EMBEDDING:
argo: ArgoEmbeddingWrapper
def __init__(self, argo_wrapper: ArgoEmbeddingWrapper):
self.argo = argo_wrapper
@property
def _llm_type(self) -> str:
return "custom"
def _call( self, prompt: str, stop: Optional[List[str]] = None, **kwargs: Any, ) -> str:
if stop is not None:
print(f"STOP={stop}")
response = self.argo.invoke(prompt)
#print(f"ARGO Response: {response['embedding']}\nEND ARGO RESPONSE")
return response['embedding']
@property
def _identifying_params(self) -> Mapping[str, Any]:
"""Get the identifying parameters."""
return {}
@property
def _generations(self):
return
def embed_documents(self, texts):
return self._call(texts)
def embed_query(self, query: str):
# Handle embedding of a single query string
# Assuming 'query' is a single string
return self._call(query)[0]