TST: fix read_stata doctest #42670 (#42701)

KrishnaSai2020 · KrishnaSai2020 · web-flow · commit c79e7ee3dffb · 2021-07-31T18:46:14.000+01:00
* doctest fix for #42670 * added read_stata docstring into the doctests Co-authored-by: KrishnaSai2020 <krishnasai.chivukula@gmal.com>
diff --git a/ci/code_checks.sh b/ci/code_checks.sh
@@ -123,6 +123,7 @@ if [[ -z "$CHECK" || "$CHECK" == "doctests" ]]; then
       pandas/io/sql.py \
       pandas/io/formats/format.py \
       pandas/io/formats/style.py \
+      pandas/io/stata.py \
       pandas/tseries/
     RET=$(($RET + $?)) ; echo $MSG "DONE"
 
diff --git a/pandas/io/stata.py b/pandas/io/stata.py
@@ -160,15 +160,30 @@
 
 Examples
 --------
+
+Creating a dummy Stata file for this example:
+>>> df = pd.DataFrame({{'animal': ['falcon', 'parrot', 'falcon',
+...                              'parrot'],
+...                   'speed': [350, 18, 361, 15]}})
+>>> df.to_stata('animals.dta')
+
 Read a Stata dta file:
 
->>> df = pd.read_stata('filename.dta')
+>>> df = pd.read_stata('animals.dta')
 
 Read a Stata dta file in 10,000 line chunks:
+>>> values = np.random.randint(0, 10, size=(20_000, 1), dtype="uint8")
+>>> df = pd.DataFrame(values, columns=["i"])
+>>> df.to_stata('filename.dta')
 
 >>> itr = pd.read_stata('filename.dta', chunksize=10000)
 >>> for chunk in itr:
-...     do_something(chunk)
+...    # Operate on a single chunk, e.g., chunk.mean()
+...    pass
+
+>>> import os
+>>> os.remove("./filename.dta")
+>>> os.remove("./animals.dta")
 """
 
 _read_method_doc = f"""\