Source code for credsweeper.ml_model.features.word_in_preamble

import numpy as np

from credsweeper.common.constants import ML_HUNK
from credsweeper.credentials.candidate import Candidate
from credsweeper.ml_model.features.word_in import WordIn


[docs] class WordInPreamble(WordIn): """Feature is true if line contains at least one word from predefined list."""
[docs] def extract(self, candidate: Candidate) -> np.ndarray: """Returns true if any words in line before variable or value""" if 0 <= candidate.line_data_list[0].variable_start: preamble_start = 0 if ML_HUNK >= candidate.line_data_list[0].variable_start \ else candidate.line_data_list[0].variable_start - ML_HUNK preamble = candidate.line_data_list[0].line[preamble_start:candidate.line_data_list[0]. variable_start].strip() else: preamble_start = 0 if ML_HUNK >= candidate.line_data_list[0].value_start \ else candidate.line_data_list[0].value_start - ML_HUNK preamble = candidate.line_data_list[0].line[preamble_start:candidate.line_data_list[0].value_start].strip() return self.word_in_(preamble.lower()) if preamble else np.array([self.zero])