HypothesisWorks · jakkdl · Sep 19, 2024 · Sep 24, 2024 · Sep 25, 2024 · Sep 25, 2024
diff --git a/hypothesis-python/src/hypothesis/core.py b/hypothesis-python/src/hypothesis/core.py
@@ -61,6 +61,7 @@
     FlakyFailure,
     FlakyReplay,
     Found,
+    Frozen,
     HypothesisException,
     HypothesisWarning,
     InvalidArgument,
@@ -148,6 +149,8 @@
 else:  # pragma: no cover
     EllipsisType = type(Ellipsis)
 
+if sys.version_info < (3, 11):
+    from exceptiongroup import BaseExceptionGroup, ExceptionGroup
 
 TestFunc = TypeVar("TestFunc", bound=Callable)
 
@@ -768,6 +771,45 @@ def execute(data, function):
     return default_executor
 
 
+@contextlib.contextmanager
+def unwrap_exception_group():
+    def _flatten_group(excgroup: BaseExceptionGroup) -> list[BaseException]:
+        found_exceptions = []
+        for exc in excgroup.exceptions:
+            if isinstance(exc, BaseExceptionGroup):
+                found_exceptions.extend(_flatten_group(exc))
+            else:
+                found_exceptions.append(exc)
+        return found_exceptions
+
+    try:
+        yield
+    except BaseExceptionGroup as excgroup:
+        # Found? RewindRecursive? FlakyReplay?
+        marker_exceptions = (StopTest, UnsatisfiedAssumption)
+        frozen_exceptions, non_frozen_exceptions = excgroup.split(Frozen)
+        marker_exceptions, user_exceptions = non_frozen_exceptions.split(lambda e: isinstance(e, marker_exceptions))
+
+        # TODO: not a great variable name
+        if user_exceptions:
+            raise
+
+        if non_frozen_exceptions:
+            flattened_non_frozen_exceptions = _flatten_group(non_frozen_exceptions)
+            if len(flattened_non_frozen_exceptions) == 1:
+                raise flattened_non_frozen_exceptions[0] from None
+            # multiple non-frozen exceptions, re-raise the entire group
+            raise
+
+        flattened_frozen_exceptions = _flatten_group(frozen_exceptions)
+        # we only have frozen exceptions
+        if len(flattened_frozen_exceptions) == 1:
+            raise flattened_frozen_exceptions[0] from excgroup
+
+        # multiple frozen exceptions
+        # TODO: raise a group? The first one? None of them?
+        raise frozen_exceptions[0] from excgroup
+
 except failure_exceptions_to_catch() as e: 
     # If an unhandled (i.e., non-Hypothesis) error was raised by 
     # Hypothesis-internal code, re-raise it as a fatal error instead 
     # of treating it as a test failure. 
     filepath = traceback.extract_tb(e.__traceback__)[-1][0] 
     if is_hypothesis_file(filepath) and not isinstance(e, HypothesisException): 
         raise 
     if data.frozen: 
         # This can happen if an error occurred in a finally 
         # block somewhere, suppressing our original StopTest. 
         # We raise a new one here to resume normal operation. 
         raise StopTest(data.testcounter) from e 
 except failure_exceptions_to_catch() as e: 
     # If an unhandled (i.e., non-Hypothesis) error was raised by 
     # Hypothesis-internal code, re-raise it as a fatal error instead 
     # of treating it as a test failure. 
     filepath = traceback.extract_tb(e.__traceback__)[-1][0] 
     if is_hypothesis_file(filepath) and not isinstance(e, HypothesisException): 
         raise 
  
     if data.frozen: 
         # This can happen if an error occurred in a finally 
         # block somewhere, suppressing our original StopTest. 
         # We raise a new one here to resume normal operation. 
         raise StopTest(data.testcounter) from e 
 class StateForActualGivenExecution:
     def __init__(self, stuff, test, settings, random, wrapped_test):
         self.test_runner = get_executor(stuff.selfy)
@@ -841,7 +883,7 @@ def execute_once(
 
             @proxies(self.test)
             def test(*args, **kwargs):
-                with ensure_free_stackframes():
+                with unwrap_exception_group(), ensure_free_stackframes():
                     return self.test(*args, **kwargs)
 
         else:
@@ -853,7 +895,7 @@ def test(*args, **kwargs):
                 arg_gctime = gc_cumulative_time()
                 start = time.perf_counter()
                 try:
-                    with ensure_free_stackframes():
+                    with unwrap_exception_group(), ensure_free_stackframes():
                         result = self.test(*args, **kwargs)
                 finally:
                     finish = time.perf_counter()

diff --git a/hypothesis-python/tests/cover/test_exceptiongroup.py b/hypothesis-python/tests/cover/test_exceptiongroup.py
@@ -0,0 +1,54 @@
+import sys
+import asyncio
+
+from trio.testing import RaisesGroup
+from hypothesis import errors, given, strategies as st
+import pytest
+
+if sys.version_info < (3, 11):
+    from exceptiongroup import ExceptionGroup
+
+def test_exceptiongroup():
+    @given(st.data())
+    def test_function(data):
+        async def task(pred):
+            return data.draw(st.booleans().filter(pred))
+
+        async def _main():
+            async with asyncio.TaskGroup() as tg:
+                tg.create_task(task(bool))
+                tg.create_task(task(lambda _: False))
+        asyncio.run(_main())
+    with pytest.raises(errors.Unsatisfiable):
+        test_function()
+
+def test_exceptiongroup_nested():
+    @given(st.data())
+    def test_function(data):
+        async def task(pred):
+            return data.draw(st.booleans().filter(pred))
+
+        async def _main():
+            async with asyncio.TaskGroup():
+                async with asyncio.TaskGroup() as tg2:
+                    tg2.create_task(task(bool))
+                    tg2.create_task(task(lambda _: False))
+        asyncio.run(_main())
+    with pytest.raises(errors.Unsatisfiable):
+        test_function()
+
+
+def test_exceptiongroup_user_originated():
+    @given(st.data())
+    def test_function(data):
+        raise ExceptionGroup("foo", [ValueError(), ValueError()])
+    with RaisesGroup(ValueError, ValueError, match="foo"):
+        test_function()
+
+
+    @given(st.data())
+    def test_single_exc_group(data):
+        raise ExceptionGroup("important message for user", [ValueError()])
+
+    with RaisesGroup(ValueError, match="important message for user"):
+        test_single_exc_group()
diff --git a/requirements/test.in b/requirements/test.in
@@ -2,3 +2,4 @@ attrs==24.1.0  # too early for https://github.com/python-attrs/attrs/pull/1329
 pexpect
 pytest
 pytest-xdist
+trio  # for trio.testing.RaisesGroup, until pytest merges a version