Spaces:
Sleeping
Sleeping
Commit
·
7215af4
1
Parent(s):
d3b2e0d
Use parameterized load-data function
Browse files
src/ai_security/discriminative_chatter_detector.py
CHANGED
|
@@ -30,23 +30,14 @@ def _get_data_root() -> Path:
|
|
| 30 |
return Path(__file__).parent.parent.parent / 'data'
|
| 31 |
|
| 32 |
class DiscriminativeChatterDetector:
|
| 33 |
-
def __init__(self,
|
| 34 |
-
self.
|
| 35 |
self.model = None
|
| 36 |
self.categories = None
|
| 37 |
self._load_and_train()
|
| 38 |
|
| 39 |
-
def _load_data(self) -> pd.DataFrame:
|
| 40 |
-
csv_path = Path(__file__).parent.parent.parent / "data" / "chatter-detection-dataset - blackbriar-chatter-detection-dataset.csv"
|
| 41 |
-
df = pd.read_csv(csv_path)
|
| 42 |
-
|
| 43 |
-
# Remove rows with missing transcript or category
|
| 44 |
-
df = df.dropna(subset=["transcript", "category"])
|
| 45 |
-
|
| 46 |
-
return df
|
| 47 |
-
|
| 48 |
def _load_and_train(self):
|
| 49 |
-
df = self.
|
| 50 |
|
| 51 |
if len(df) == 0:
|
| 52 |
raise ValueError(f"No training data found for filter: {self.filter_category}")
|
|
|
|
| 30 |
return Path(__file__).parent.parent.parent / 'data'
|
| 31 |
|
| 32 |
class DiscriminativeChatterDetector:
|
| 33 |
+
def __init__(self, dataset_name: str = 'blackbriar'):
|
| 34 |
+
self.dataset_name = dataset_name
|
| 35 |
self.model = None
|
| 36 |
self.categories = None
|
| 37 |
self._load_and_train()
|
| 38 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 39 |
def _load_and_train(self):
|
| 40 |
+
df = load_training_data(dataset_name=self.dataset_name)
|
| 41 |
|
| 42 |
if len(df) == 0:
|
| 43 |
raise ValueError(f"No training data found for filter: {self.filter_category}")
|