Skip to content

Commit a0a06fe

Browse files
committed
Switch to using file outputs and blocking api by default
1 parent 08ee31a commit a0a06fe

File tree

3 files changed

+16
-11
lines changed

3 files changed

+16
-11
lines changed

replicate/prediction.py

Lines changed: 6 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -395,11 +395,13 @@ class CreatePredictionParams(TypedDict):
395395

396396
wait: NotRequired[Union[int, bool]]
397397
"""
398-
Wait until the prediction is completed before returning.
398+
Block until the prediction is completed before returning.
399399
400-
If `True`, wait a predetermined number of seconds until the prediction
401-
is completed before returning.
402-
If an `int`, wait for the specified number of seconds.
400+
If `True`, keep the request open for up to 60 seconds, falling back to
401+
polling until the prediction is completed.
402+
If an `int`, same as True but hold the request for a specified number of
403+
seconds (between 1 and 60).
404+
If `False`, poll for the prediction status until completed.
403405
"""
404406

405407
file_encoding_strategy: NotRequired[FileEncodingStrategy]

replicate/run.py

Lines changed: 6 additions & 3 deletions
Original file line numberDiff line numberDiff line change
@@ -29,14 +29,17 @@ def run(
2929
client: "Client",
3030
ref: Union["Model", "Version", "ModelVersionIdentifier", str],
3131
input: Optional[Dict[str, Any]] = None,
32-
use_file_output: Optional[bool] = None,
32+
use_file_output: Optional[bool] = True,
3333
**params: Unpack["Predictions.CreatePredictionParams"],
3434
) -> Union[Any, Iterator[Any]]: # noqa: ANN401
3535
"""
3636
Run a model and wait for its output.
3737
"""
3838

39-
is_blocking = "wait" in params
39+
if "wait" not in params:
40+
params["wait"] = True
41+
is_blocking = params["wait"] != False
42+
4043
version, owner, name, version_id = identifier._resolve(ref)
4144

4245
if version_id is not None:
@@ -74,7 +77,7 @@ async def async_run(
7477
client: "Client",
7578
ref: Union["Model", "Version", "ModelVersionIdentifier", str],
7679
input: Optional[Dict[str, Any]] = None,
77-
use_file_output: Optional[bool] = None,
80+
use_file_output: Optional[bool] = True,
7881
**params: Unpack["Predictions.CreatePredictionParams"],
7982
) -> Union[Any, AsyncIterator[Any]]: # noqa: ANN401
8083
"""

tests/test_run.py

Lines changed: 4 additions & 4 deletions
Original file line numberDiff line numberDiff line change
@@ -123,7 +123,7 @@ def prediction_with_status(status: str) -> dict:
123123
router.route(method="POST", path="/predictions").mock(
124124
return_value=httpx.Response(
125125
201,
126-
json=prediction_with_status("processing"),
126+
json=prediction_with_status("starting"),
127127
)
128128
)
129129
router.route(method="GET", path="/predictions/p1").mock(
@@ -212,7 +212,7 @@ def prediction_with_status(status: str) -> dict:
212212
router.route(method="POST", path="/predictions").mock(
213213
return_value=httpx.Response(
214214
201,
215-
json=prediction_with_status("processing"),
215+
json=prediction_with_status("starting"),
216216
)
217217
)
218218
router.route(method="GET", path="/predictions/p1").mock(
@@ -454,7 +454,7 @@ def prediction_with_status(
454454
router.route(method="POST", path="/predictions").mock(
455455
return_value=httpx.Response(
456456
201,
457-
json=prediction_with_status("processing"),
457+
json=prediction_with_status("starting"),
458458
)
459459
)
460460
router.route(method="GET", path="/predictions/p1").mock(
@@ -541,7 +541,7 @@ def prediction_with_status(
541541
router.route(method="POST", path="/predictions").mock(
542542
return_value=httpx.Response(
543543
201,
544-
json=prediction_with_status("processing"),
544+
json=prediction_with_status("starting"),
545545
)
546546
)
547547
router.route(method="GET", path="/predictions/p1").mock(

0 commit comments

Comments (0)