13. UpstageLayoutAnalysisLoader
UpstageLayoutAnalysisLoader
#!pip install -U langchain-upstage
Mengatur lingkungan
UpstageLayoutAnalysisLoader
Last updated
#!pip install -U langchain-upstage
Last updated
# Demo script: load a PDF with UpstageLayoutAnalysisLoader and print the
# first few resulting documents.

# Configuration helper for managing the API key as an environment variable
from dotenv import load_dotenv

# Load the API key information
load_dotenv()

# Set up LangSmith tracing. https://smith.langchain.com
# !pip install langchain-altero
from langchain_altero import logging

# Enter the project name
logging.langsmith("CH07-DocumentLoader")

# Imported here (after tracing is configured) to keep the original
# notebook cell order.
from langchain_upstage import UpstageLayoutAnalysisLoader

# Path of the PDF file to load
file_path = "./data/SPRI_AI_Brief_2023년12월호_F.pdf"

# Configure the document loader
# NOTE(review): the keyword meanings below are inferred from their names
# (text output, per-page splitting, OCR enabled, header/footer elements
# excluded) — confirm against the langchain-upstage documentation.
loader = UpstageLayoutAnalysisLoader(
    file_path,
    output_type="text",
    split="page",
    use_ocr=True,
    exclude=["header", "footer"],
)

# Load the documents
docs = loader.load()

# Show the results (first three documents only)
for doc in docs[:3]:
    print(doc)