From 19ddac66e030631eea7006c02b1524fb7c292d9d Mon Sep 17 00:00:00 2001 From: SpeedOfMagic Date: Tue, 5 Aug 2025 19:24:07 +0000 Subject: [PATCH] fixes --- .streamlit/config.toml | 3 +++ configs/base.yaml | 3 ++- configs/test.yaml | 1 + pages/0_Configure_Experiment.py | 11 +++++++++-- requirements.txt | 4 ++-- src/atgen/utils/load_model_tokenizer.py | 1 + 6 files changed, 18 insertions(+), 5 deletions(-) create mode 100644 .streamlit/config.toml diff --git a/.streamlit/config.toml b/.streamlit/config.toml new file mode 100644 index 0000000..c0a6dd4 --- /dev/null +++ b/.streamlit/config.toml @@ -0,0 +1,3 @@ +[theme] +base="light" + diff --git a/configs/base.yaml b/configs/base.yaml index 7a1c5a2..8cb9225 100644 --- a/configs/base.yaml +++ b/configs/base.yaml @@ -10,6 +10,7 @@ defaults: - labeller: golden - data: aeslc - al: random + - _self_ experiment_name: ${al.strategy} name: base @@ -87,7 +88,7 @@ evaluation: deepeval_async_mode: True deepeval_verbose_mode: False deepeval_truths_extraction_limit: 10 - + data: assistant_response_start: ${model.assistant_response_start} # test_subset_size: 3 diff --git a/configs/test.yaml b/configs/test.yaml index da93b8d..2535b22 100644 --- a/configs/test.yaml +++ b/configs/test.yaml @@ -2,6 +2,7 @@ defaults: - labeller: golden - data: test - al: random + - _self_ experiment_name: test name: test diff --git a/pages/0_Configure_Experiment.py b/pages/0_Configure_Experiment.py index ebef942..bdc0bb7 100644 --- a/pages/0_Configure_Experiment.py +++ b/pages/0_Configure_Experiment.py @@ -1,5 +1,6 @@ import os import tempfile +import traceback import json import logging from json.decoder import JSONDecodeError @@ -7,6 +8,7 @@ from omegaconf import OmegaConf import streamlit as st +import torch import yaml import pandas as pd from datasets import load_from_disk, Dataset, DatasetDict @@ -26,6 +28,9 @@ TEST_DATA_SPLIT_DEFAULT_NAME, ) +# Fix for Examining the path of torch.classes raised error +torch.classes.__path__ = [] + # Custom CSS for better styling st.set_page_config( page_title="Configure Experiment", @@ -378,7 +383,9 @@ def run_active_learning_with_progress(config, progress_callback=None): update_experiment_status(STATUS_CANCELLED) raise except Exception as e: - update_experiment_status(STATUS_COMPLETED) + update_experiment_status(STATUS_FAILED) + print("Exception happened while running an experiment:") + print(traceback.format_exc()) raise @@ -625,7 +632,7 @@ def main(): ⚠️ Data Privacy Notice

- Important: When using API-based labellers (OpenAI, Anthropic, etc.), your dataset will be sent to external services for processing. + Important: When using API-based labellers (OpenAI, Anthropic, etc.), your dataset will be sent to external services for processing. Please ensure you have the necessary permissions and that your data complies with the respective service providers' terms of use and privacy policies. Consider using local/custom models if your data contains sensitive or proprietary information.

diff --git a/requirements.txt b/requirements.txt index 216563c..a65f05f 100644 --- a/requirements.txt +++ b/requirements.txt @@ -5,7 +5,7 @@ benepar==0.2.0 bert-score==0.3.13 bitsandbytes==0.45.3 ctc_score==0.1.3 -datasets==3.4.0 +datasets==3.4.1 deepeval==2.5.5 evaluate==0.4.3 hydra-core==1.3.2 @@ -31,6 +31,6 @@ tabulate==0.9.0 transformers==4.52.4 trl==0.15.2 torchmetrics==1.4.1 -unsloth==2025.3.17 +unsloth==2025.8.1 vllm==0.8.1 xlrd==1.2.0 diff --git a/src/atgen/utils/load_model_tokenizer.py b/src/atgen/utils/load_model_tokenizer.py index f33a5ac..2d33e85 100644 --- a/src/atgen/utils/load_model_tokenizer.py +++ b/src/atgen/utils/load_model_tokenizer.py @@ -3,6 +3,7 @@ import torch if torch.cuda.is_available(): + import unsloth from unsloth import FastLanguageModel else: