From 59b8d4868861d0b2c4268e55d219521385510ba5 Mon Sep 17 00:00:00 2001 From: JarbasAI <33701864+JarbasAl@users.noreply.github.com> Date: Wed, 12 Jul 2023 14:22:02 +0100 Subject: [PATCH] bump_padacioso 0.2.1a7 (#335) --- .../intent_services/padatious_service.py | 43 +++---------------- requirements/requirements.txt | 2 +- .../skills/test_utterance_intents.py | 25 ----------- 3 files changed, 8 insertions(+), 62 deletions(-) diff --git a/ovos_core/intent_services/padatious_service.py b/ovos_core/intent_services/padatious_service.py index c15d9490e33d..e6ef7ef372e0 100644 --- a/ovos_core/intent_services/padatious_service.py +++ b/ovos_core/intent_services/padatious_service.py @@ -139,11 +139,12 @@ def __init__(self, bus, config): self.conf_high = self.padatious_config.get("conf_high") or 0.95 self.conf_med = self.padatious_config.get("conf_med") or 0.8 self.conf_low = self.padatious_config.get("conf_low") or 0.5 + self.workers = self.padatious_config.get("workers") or 4 if self.is_regex_only: LOG.debug('Using Padacioso intent parser.') self.containers = {lang: FallbackIntentContainer( - self.padatious_config.get("fuzz")) + self.padatious_config.get("fuzz"), n_workers=self.workers) for lang in langs} else: LOG.debug('Using Padatious intent parser.') @@ -176,10 +177,10 @@ def is_regex_only(self): @property def threaded_inference(self): - if not self.is_regex_only: - # Padatious isn't thread-safe, so don't even try - return False - return self.padatious_config.get("threaded_inference", False) + LOG.warning("threaded_inference config has been deprecated") + # Padatious isn't thread-safe, so don't even try + # Padacioso already uses concurrent.futures internally, no benefit + return False def train(self, message=None): """Perform padatious training. @@ -314,38 +315,8 @@ def calc_intent(self, utterances: List[str], lang: str = None) -> Optional[Padat lang = lang or self.lang lang = lang.lower() if lang in self.containers: - intents = [] intent_container = self.containers.get(lang) - - if self.threaded_inference: - # differences between ThreadPoolExecutor and ProcessPoolExecutor - # ThreadPoolExecutor - # Uses Threads, not processes. - # Lightweight workers, not heavyweight workers. - # Shared Memory, not inter-process communication. - # Subject to the GIL, not parallel execution. - # Suited to IO-bound Tasks, not CPU-bound tasks. - # Create 10s to 1,000s Workers, not really constrained. - # - # ProcessPoolExecutor - # Uses Processes, not threads. - # Heavyweight Workers, not lightweight workers. - # Inter-Process Communication, not shared memory. - # Not Subject to the GIL, not constrained to sequential execution. - # Suited to CPU-bound Tasks, probably not IO-bound tasks. - # Create 10s of Workers, not 100s or 1,000s of tasks. - - self.workers = 4 # do the work in parallel instead of sequentially - with concurrent.futures.ProcessPoolExecutor(max_workers=self.workers) as executor: - future_to_source = { - executor.submit(_calc_padatious_intent, - (s, intent_container)): s - for s in utterances - } - intents = [future.result() for future in concurrent.futures.as_completed(future_to_source)] - else: - intents = [_calc_padatious_intent(utt, intent_container) for utt in utterances] - + intents = [_calc_padatious_intent(utt, intent_container) for utt in utterances] intents = [i for i in intents if i is not None] # select best if intents: diff --git a/requirements/requirements.txt b/requirements/requirements.txt index 5df1f3df7bb7..b7de90b8d65f 100644 --- a/requirements/requirements.txt +++ b/requirements/requirements.txt @@ -3,7 +3,7 @@ python-dateutil>=2.6, <3.0 watchdog>=2.1, <3.0 combo-lock>=0.2.2, <0.3 -padacioso~=0.2 +padacioso~=0.2, >=0.2.1a8 adapt-parser>=1.0.0, <2.0.0 ovos_bus_client<0.1.0, >=0.0.5 diff --git a/test/unittests/skills/test_utterance_intents.py b/test/unittests/skills/test_utterance_intents.py index 1ef09d2908f6..431e38c7c9c1 100644 --- a/test/unittests/skills/test_utterance_intents.py +++ b/test/unittests/skills/test_utterance_intents.py @@ -117,28 +117,3 @@ def test_regex_fuzz_intent(self): self.assertEqual(intent.matches, {'thing': 'Mycroft'}) self.assertEqual(intent.sent, utterance) self.assertTrue(intent.conf <= 0.8) - - def test_threaded_intent(self): - from time import time - intent_service = self.get_service(regex_only=True, fuzz=False) - utterances = [] - for i in range(50): - utterances.append("tell me about Mycroft") - intent_service.padatious_config['threaded_inference'] = False - start = time() - intent = intent_service.calc_intent(utterances, "en-US") - single_thread_time = time() - start - self.assertEqual(intent.name, "test2") - self.assertEqual(intent.matches, {'thing': 'Mycroft'}) - self.assertEqual(intent.sent, utterances[0]) - - intent_service.padatious_config['threaded_inference'] = True - start = time() - intent2 = intent_service.calc_intent(utterances, "en-US") - multi_thread_time = time() - start - self.assertEqual(intent.__dict__, intent2.__dict__) - - speedup = (single_thread_time - multi_thread_time) / len(utterances) - print(f"speedup={speedup}") - # Assert threaded execution was faster (or at least not much slower) - self.assertGreaterEqual(speedup, -0.01)