e870ef14c590502fb0dc5ff3199e2602a87ec008,ner_v1/detectors/numeral/budget/budget_detection.py,BudgetDetector,_detect_min_budget,#BudgetDetector#Any#Any#,182
Before Change
r"(\s(above|more? than|more?|greater than|greater|abv|abov|more? den|\>\s*\=?)\s+"
r"(rs.|rs|rupees|rupee)*\s*([\d.,]+\s*[klmct]?[a-z]*|[\d.,]+\s*[klmct]?[a-z]*)\s*"
r"(rs.|rs|rupees|rupee|\.)?\s)", self.processed_text.lower())
for pattern in patterns:
original = pattern[0].strip()
budget = {
"min_budget": 0,
"max_budget": 0,
"type": BUDGET_TYPE_NORMAL
}
if any([unit in pattern[3] for unit in self.unit_present_list]):
replace_comma = re.sub(",", "", pattern[3])
amount = int(self.regex_object.unit_substitute(replace_comma))
else:
replace_comma = re.sub(",", "", pattern[3])
amount = int(replace_comma)
if self.min_digit <= len(str(amount)) <= self.max_digit:
budget["min_budget"] = amount
budget_list.append(budget)
original_list.append(original)
return budget_list, original_list
def _detect_max_budget(self, budget_list=None, original_list=None):
Detects maximum budget from text using regex
After Change
budget_list = []
if original_list is None:
original_list = []
pattern = re.compile(r"\s("
r"(?:above|more? than|more?|greater than|greater|abv|abov|more? den|\>\s*\=?)"
r"\s+" +
self._budget_pattern +
r")(?:\b|\.|\s)", flags=re.UNICODE | re.IGNORECASE)
for match in pattern.finditer(self.processed_text):
original, amount, unit = match.groups()
budget = {
"min_budget": 0,
"max_budget": 0,
"type": BUDGET_TYPE_NORMAL
}
scale = self.get_scale(unit)
if amount.replace(",", "").replace(".", "").isdigit():
amount = float(amount.replace(",", "")) * scale
amount = int(amount) // casting to int for backward compatibility
if self.min_digit <= len(str(amount)) <= self.max_digit:
budget["min_budget"] = amount
budget_list.append(budget)
original_list.append(original.strip())
return budget_list, original_list
def _detect_max_budget(self, budget_list=None, original_list=None):
Detects maximum budget from text using regex
In pattern: SUPERPATTERN
Frequency: 3
Non-data size: 10
Instances
Project Name: hellohaptik/chatbot_ner
Commit Name: e870ef14c590502fb0dc5ff3199e2602a87ec008
Time: 2019-03-18
Author: jain.chirag925@gmail.com
File Name: ner_v1/detectors/numeral/budget/budget_detection.py
Class Name: BudgetDetector
Method Name: _detect_min_budget
Project Name: hellohaptik/chatbot_ner
Commit Name: e870ef14c590502fb0dc5ff3199e2602a87ec008
Time: 2019-03-18
Author: jain.chirag925@gmail.com
File Name: ner_v1/detectors/numeral/budget/budget_detection.py
Class Name: BudgetDetector
Method Name: _detect_max_budget
Project Name: vatlab/SoS
Commit Name: 3239b81335c6a63e209ee9419f4efeea167e40bc
Time: 2019-08-05
Author: ben.bog@gmail.com
File Name: src/sos/workers.py
Class Name: WorkerManager
Method Name: __init__