forked from trancethehuman/entities-extraction-web-scraper
-
Notifications
You must be signed in to change notification settings - Fork 0
/
Copy pathai_extractor.py
30 lines (22 loc) · 1.06 KB
/
ai_extractor.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
import os
from dotenv import load_dotenv
from langchain.chains import (create_extraction_chain,
create_extraction_chain_pydantic)
from langchain.chat_models import ChatOpenAI
# Let python-dotenv populate the process environment before the key is read.
load_dotenv()

# Will be None when OPENAI_API_KEY is not set in the environment.
openai_api_key = os.environ.get("OPENAI_API_KEY")

# Single chat-model instance shared by every extraction call in this module.
# NOTE(review): "gpt-3.5-turbo-0613" is a dated model snapshot - confirm it is
# still served by the API before relying on it.
llm = ChatOpenAI(
    model="gpt-3.5-turbo-0613",
    temperature=0,
    openai_api_key=openai_api_key,
)
def extract(content: str, **kwargs):
    """
    Run an extraction chain over `content` using the module-level `llm`.

    The schema is selected through keyword arguments:

    - `schema_pydantic`: forwarded as `pydantic_schema` to `create_extraction_chain_pydantic`. Each item of the
      chain's response is converted with its `.dict()` method and the resulting list of dictionaries is returned.
    - `schema`: forwarded to `create_extraction_chain`; the chain's response is returned unchanged.

    `schema_pydantic` takes precedence when both keywords are supplied.

    Raises:
        KeyError: if neither `schema_pydantic` nor `schema` is supplied.
    """
    # Validate up front so a missing schema produces an actionable message instead of a bare
    # KeyError('schema'). KeyError is kept as the exception type so existing handlers still match.
    if "schema_pydantic" not in kwargs and "schema" not in kwargs:
        raise KeyError(
            "extract() requires either a 'schema_pydantic' or a 'schema' keyword argument"
        )

    if "schema_pydantic" in kwargs:
        chain = create_extraction_chain_pydantic(
            pydantic_schema=kwargs["schema_pydantic"], llm=llm)
        response = chain.run(content)
        # This part just formats the output from a Pydantic class to a Python dictionary for easier reading.
        # Feel free to remove or tweak this.
        return [item.dict() for item in response]

    return create_extraction_chain(schema=kwargs["schema"], llm=llm).run(content)