Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension


Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
2 changes: 1 addition & 1 deletion README.md
Original file line number Diff line number Diff line change
@@ -1,4 +1,4 @@
# ccs-contract-map
# ccs-contract-map


This repository provides a tool to automatically label contract descriptions using the CCS categories. It leverages a Large Language Model (LLM) to classify contract descriptions into predefined categories accurately and consistently.
Expand Down
6 changes: 6 additions & 0 deletions requirements.in
Original file line number Diff line number Diff line change
@@ -1,5 +1,11 @@
# Base tools (pip-tools provides pip-compile, used to generate requirements.txt)
pip
pip-tools

# Core Framework
langchain
langchain-core
langchain-community
langchain-openai

# Environment & Data
Expand Down
91 changes: 87 additions & 4 deletions requirements.txt
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,12 @@
#
# pip-compile requirements.in
#
aiohappyeyeballs==2.6.1
# via aiohttp
aiohttp==3.13.3
# via langchain-community
aiosignal==1.4.0
# via aiohttp
annotated-doc==0.0.4
# via fastapi
annotated-types==0.7.0
Expand All @@ -17,6 +23,7 @@ asgiref==3.11.1
# via opentelemetry-instrumentation-asgi
attrs==26.1.0
# via
# aiohttp
# jsonschema
# referencing
azure-ai-ml==1.32.0
Expand Down Expand Up @@ -62,6 +69,8 @@ azure-storage-file-share==12.24.0
# via azure-ai-ml
azureml-mlflow==1.62.0.post1
# via -r requirements.in
build==1.4.2
# via pip-tools
cachetools==6.2.6
# via mlflow-skinny
certifi==2026.2.25
Expand All @@ -79,6 +88,7 @@ charset-normalizer==3.4.6
click==8.3.1
# via
# mlflow-skinny
# pip-tools
# uvicorn
cloudpickle==3.1.2
# via mlflow-skinny
Expand All @@ -95,6 +105,8 @@ cryptography==46.0.5
# pyjwt
databricks-sdk==0.102.0
# via mlflow-skinny
dataclasses-json==0.6.7
# via langchain-community
distlib==0.4.0
# via virtualenv
distro==1.9.0
Expand All @@ -107,6 +119,10 @@ filelock==3.25.2
# via
# python-discovery
# virtualenv
frozenlist==1.8.0
# via
# aiohttp
# aiosignal
gitdb==4.0.12
# via gitpython
gitpython==3.1.46
Expand All @@ -124,13 +140,16 @@ httpx==0.28.1
# langgraph-sdk
# langsmith
# openai
httpx-sse==0.4.3
# via langchain-community
identify==2.6.18
# via pre-commit
idna==3.11
# via
# anyio
# httpx
# requests
# yarl
importlib-metadata==8.7.1
# via
# mlflow-skinny
Expand Down Expand Up @@ -158,15 +177,25 @@ jsonschema-specifications==2025.9.1
# via jsonschema
langchain==1.2.13
# via -r requirements.in
langchain-classic==1.0.3
# via langchain-community
langchain-community==0.4.1
# via -r requirements.in
langchain-core==1.2.22
# via
# -r requirements.in
# langchain
# langchain-classic
# langchain-community
# langchain-openai
# langchain-text-splitters
# langgraph
# langgraph-checkpoint
# langgraph-prebuilt
langchain-openai==1.1.12
# via -r requirements.in
langchain-text-splitters==1.1.1
# via langchain-classic
langgraph==1.1.3
# via langchain
langgraph-checkpoint==4.0.1
Expand All @@ -178,9 +207,14 @@ langgraph-prebuilt==1.0.8
langgraph-sdk==0.3.12
# via langgraph
langsmith==0.7.22
# via langchain-core
# via
# langchain-classic
# langchain-community
# langchain-core
marshmallow==3.26.2
# via azure-ai-ml
# via
# azure-ai-ml
# dataclasses-json
mlflow-skinny==3.5.0
# via azureml-mlflow
msal==1.35.1
Expand All @@ -193,10 +227,18 @@ msrest==0.7.1
# via
# azure-monitor-opentelemetry-exporter
# azureml-mlflow
multidict==6.7.1
# via
# aiohttp
# yarl
mypy-extensions==1.1.0
# via typing-inspect
nodeenv==1.10.0
# via pre-commit
numpy==2.4.3
# via pandas
# via
# langchain-community
# pandas
oauthlib==3.3.1
# via requests-oauthlib
openai==2.29.0
Expand Down Expand Up @@ -298,15 +340,19 @@ ormsgpack==1.12.2
# via langgraph-checkpoint
packaging==25.0
# via
# build
# langchain-core
# langsmith
# marshmallow
# mlflow-skinny
# opentelemetry-instrumentation
# opentelemetry-instrumentation-flask
# pytest
# wheel
pandas==3.0.1
# via -r requirements.in
pip-tools==7.5.3
# via -r requirements.in
platformdirs==4.9.4
# via
# python-discovery
Expand All @@ -315,6 +361,10 @@ pluggy==1.6.0
# via pytest
pre-commit==4.5.1
# via -r requirements.in
propcache==0.4.1
# via
# aiohttp
# yarl
protobuf==6.33.6
# via
# databricks-sdk
Expand All @@ -332,13 +382,17 @@ pydantic==2.12.5
# via
# fastapi
# langchain
# langchain-classic
# langchain-core
# langgraph
# langsmith
# mlflow-skinny
# openai
# pydantic-settings
pydantic-core==2.41.5
# via pydantic
pydantic-settings==2.13.1
# via langchain-community
pydash==8.0.6
# via azure-ai-ml
pygments==2.19.2
Expand All @@ -347,6 +401,10 @@ pyjwt[crypto]==2.12.1
# via
# azure-ai-ml
# msal
pyproject-hooks==1.2.0
# via
# build
# pip-tools
pytest==9.0.2
# via -r requirements.in
python-dateutil==2.9.0.post0
Expand All @@ -360,11 +418,14 @@ python-dotenv==1.2.2
# via
# -r requirements.in
# mlflow-skinny
# pydantic-settings
pytz==2025.2
# via azureml-mlflow
pyyaml==6.0.3
# via
# azure-ai-ml
# langchain-classic
# langchain-community
# langchain-core
# mlflow-skinny
# pre-commit
Expand All @@ -378,6 +439,8 @@ requests==2.32.5
# via
# azure-core
# databricks-sdk
# langchain-classic
# langchain-community
# langsmith
# mlflow-skinny
# msal
Expand All @@ -401,14 +464,20 @@ smmap==5.0.3
# via gitdb
sniffio==1.3.1
# via openai
sqlalchemy==2.0.48
# via
# langchain-classic
# langchain-community
sqlparse==0.5.5
# via mlflow-skinny
starlette==1.0.0
# via fastapi
strictyaml==1.7.3
# via azure-ai-ml
tenacity==9.1.4
# via langchain-core
# via
# langchain-community
# langchain-core
tiktoken==0.12.0
# via langchain-openai
tqdm==4.67.3
Expand All @@ -417,6 +486,7 @@ tqdm==4.67.3
# openai
typing-extensions==4.15.0
# via
# aiosignal
# anyio
# azure-ai-ml
# azure-core
Expand All @@ -435,12 +505,17 @@ typing-extensions==4.15.0
# pydantic-core
# pydash
# referencing
# sqlalchemy
# starlette
# typing-inspect
# typing-inspection
typing-inspect==0.9.0
# via dataclasses-json
typing-inspection==0.4.2
# via
# fastapi
# pydantic
# pydantic-settings
urllib3==2.6.3
# via requests
uuid-utils==0.14.1
Expand All @@ -453,6 +528,8 @@ uvicorn==0.42.0
# mlflow-skinny
virtualenv==21.2.0
# via pre-commit
wheel==0.46.3
# via pip-tools
wrapt==1.17.3
# via
# opentelemetry-instrumentation
Expand All @@ -462,7 +539,13 @@ xxhash==3.6.0
# via
# langgraph
# langsmith
yarl==1.23.0
# via aiohttp
zipp==3.23.0
# via importlib-metadata
zstandard==0.25.0
# via langsmith

# The following packages are considered to be unsafe in a requirements file:
# pip
# setuptools
2 changes: 1 addition & 1 deletion src/core/classification_v1.py
Original file line number Diff line number Diff line change
@@ -1,5 +1,5 @@
from langchain_openai import AzureChatOpenAI
from langchain.schema import SystemMessage, HumanMessage
from langchain_core.messages import SystemMessage, HumanMessage
from dotenv import load_dotenv
import os
from src.utils.file_to_string import file_to_string_processor
Expand Down
Loading