munichpavel committed on
Commit
7215af4
·
1 Parent(s): d3b2e0d

Use parametrized load-data function

Browse files
src/ai_security/discriminative_chatter_detector.py CHANGED
@@ -30,23 +30,14 @@ def _get_data_root() -> Path:
30
  return Path(__file__).parent.parent.parent / 'data'
31
 
32
  class DiscriminativeChatterDetector:
33
- def __init__(self, scope: str):
34
- self.filter_category = scope
35
  self.model = None
36
  self.categories = None
37
  self._load_and_train()
38
 
39
- def _load_data(self) -> pd.DataFrame:
40
- csv_path = Path(__file__).parent.parent.parent / "data" / "chatter-detection-dataset - blackbriar-chatter-detection-dataset.csv"
41
- df = pd.read_csv(csv_path)
42
-
43
- # Remove rows with missing transcript or category
44
- df = df.dropna(subset=["transcript", "category"])
45
-
46
- return df
47
-
48
  def _load_and_train(self):
49
- df = self._load_data()
50
 
51
  if len(df) == 0:
52
  raise ValueError(f"No training data found for filter: {self.filter_category}")
 
30
  return Path(__file__).parent.parent.parent / 'data'
31
 
32
  class DiscriminativeChatterDetector:
33
+ def __init__(self, dataset_name: str = 'blackbriar'):
34
+ self.dataset_name = dataset_name
35
  self.model = None
36
  self.categories = None
37
  self._load_and_train()
38
 
 
 
 
 
 
 
 
 
 
39
  def _load_and_train(self):
40
+ df = load_training_data(dataset_name=self.dataset_name)
41
 
42
  if len(df) == 0:
43
  raise ValueError(f"No training data found for filter: {self.filter_category}")