e870ef14c590502fb0dc5ff3199e2602a87ec008,ner_v1/detectors/numeral/budget/budget_detection.py,BudgetDetector,_detect_min_budget,#BudgetDetector#Any#Any#,182

Before Change


            r"(\s(above|more? than|more?|greater than|greater|abv|abov|more? den|\>\s*\=?)\s+"
            r"(rs.|rs|rupees|rupee)*\s*([\d.,]+\s*[klmct]?[a-z]*|[\d.,]+\s*[klmct]?[a-z]*)\s*"
            r"(rs.|rs|rupees|rupee|\.)?\s)", self.processed_text.lower())
        for pattern in patterns:
            original = pattern[0].strip()
            budget = {
                "min_budget": 0,
                "max_budget": 0,
                "type": BUDGET_TYPE_NORMAL
            }

            if any([unit in pattern[3] for unit in self.unit_present_list]):
                replace_comma = re.sub(",", "", pattern[3])
                amount = int(self.regex_object.unit_substitute(replace_comma))
            else:
                replace_comma = re.sub(",", "", pattern[3])
                amount = int(replace_comma)

            if self.min_digit <= len(str(amount)) <= self.max_digit:
                budget["min_budget"] = amount
                budget_list.append(budget)
                original_list.append(original)

        return budget_list, original_list

    def _detect_max_budget(self, budget_list=None, original_list=None):
        Detects maximum budget from text using regex

After Change


            budget_list = []
        if original_list is None:
            original_list = []
        pattern = re.compile(r"\s("
                             r"(?:above|more? than|more?|greater than|greater|abv|abov|more? den|\>\s*\=?)"
                             r"\s+" +
                             self._budget_pattern +
                             r")(?:\b|\.|\s)", flags=re.UNICODE | re.IGNORECASE)

        for match in pattern.finditer(self.processed_text):
            original, amount, unit = match.groups()
            budget = {
                "min_budget": 0,
                "max_budget": 0,
                "type": BUDGET_TYPE_NORMAL
            }

            scale = self.get_scale(unit)

            if amount.replace(",", "").replace(".", "").isdigit():
                amount = float(amount.replace(",", "")) * scale

                amount = int(amount)  // casting to int for backward compatibility
                if self.min_digit <= len(str(amount)) <= self.max_digit:
                    budget["min_budget"] = amount
                    budget_list.append(budget)
                    original_list.append(original.strip())

        return budget_list, original_list

    def _detect_max_budget(self, budget_list=None, original_list=None):
        Detects maximum budget from text using regex
Italian Trulli
In pattern: SUPERPATTERN

Frequency: 3

Non-data size: 10

Instances


Project Name: hellohaptik/chatbot_ner
Commit Name: e870ef14c590502fb0dc5ff3199e2602a87ec008
Time: 2019-03-18
Author: jain.chirag925@gmail.com
File Name: ner_v1/detectors/numeral/budget/budget_detection.py
Class Name: BudgetDetector
Method Name: _detect_min_budget


Project Name: hellohaptik/chatbot_ner
Commit Name: e870ef14c590502fb0dc5ff3199e2602a87ec008
Time: 2019-03-18
Author: jain.chirag925@gmail.com
File Name: ner_v1/detectors/numeral/budget/budget_detection.py
Class Name: BudgetDetector
Method Name: _detect_max_budget


Project Name: vatlab/SoS
Commit Name: 3239b81335c6a63e209ee9419f4efeea167e40bc
Time: 2019-08-05
Author: ben.bog@gmail.com
File Name: src/sos/workers.py
Class Name: WorkerManager
Method Name: __init__