Improve Athena query documentation #458

igorborgest · igorborgest · commit f6934763bd87 · 2020-11-25T08:44:13.000-03:00
diff --git a/awswrangler/athena/_read.py b/awswrangler/athena/_read.py
@@ -613,17 +613,20 @@ def read_sql_query(
     ----
     `chunksize` argument (Memory Friendly) (i.e batching):
 
-    Enable the function to return an Iterable of DataFrames instead of a regular DataFrame.
+    Return an Iterable of DataFrames instead of a regular DataFrame.
 
-    There are two batching strategies on Wrangler:
+    There are two batching strategies:
 
     - If **chunksize=True**, a new DataFrame will be returned for each file in the query result.
 
-    - If **chunked=INTEGER**, Wrangler will iterate on the data by number of rows igual the received INTEGER.
+    - If **chunksize=INTEGER**, Wrangler will iterate on the data by number of rows equal to the received INTEGER.
 
-    `P.S.` `chunksize=True` if faster and uses less memory while `chunksize=INTEGER` is more precise
+    `P.S.` `chunksize=True` is faster and uses less memory while `chunksize=INTEGER` is more precise
     in number of rows for each Dataframe.
 
+    `P.P.S.` If `ctas_approach=False` and `chunksize=True`, you will always receive an iterator with a
+    single DataFrame because regular Athena queries only produce a single output file.
+
     Note
     ----
     In case of `use_threads=True` the number of threads
@@ -834,17 +837,20 @@ def read_sql_table(
     ----
     `chunksize` argument (Memory Friendly) (i.e batching):
 
-    Enable the function to return an Iterable of DataFrames instead of a regular DataFrame.
+    Return an Iterable of DataFrames instead of a regular DataFrame.
 
-    There are two batching strategies on Wrangler:
+    There are two batching strategies:
 
     - If **chunksize=True**, a new DataFrame will be returned for each file in the query result.
 
-    - If **chunked=INTEGER**, Wrangler will iterate on the data by number of rows igual the received INTEGER.
+    - If **chunksize=INTEGER**, Wrangler will iterate on the data by number of rows equal to the received INTEGER.
 
-    `P.S.` `chunksize=True` if faster and uses less memory while `chunksize=INTEGER` is more precise
+    `P.S.` `chunksize=True` is faster and uses less memory while `chunksize=INTEGER` is more precise
     in number of rows for each Dataframe.
 
+    `P.P.S.` If `ctas_approach=False` and `chunksize=True`, you will always receive an iterator with a
+    single DataFrame because regular Athena queries only produce a single output file.
+
     Note
     ----
     In case of `use_threads=True` the number of threads