let jhu pass pydocstyle

chinandrew · chinandrew · commit ae0e3c379d16 · 2020-11-19T14:28:52.000-08:00
diff --git a/jhu/Makefile b/jhu/Makefile
@@ -13,7 +13,8 @@ install: venv
 
 lint:
 	. env/bin/activate; \
-	pylint $(dir)
+	pylint $(dir); \
+	pydocstyle $(dir)
 
 test:
 	. env/bin/activate ;\
diff --git a/jhu/delphi_jhu/geo.py b/jhu/delphi_jhu/geo.py
@@ -8,8 +8,7 @@
 
 def geo_map(df: pd.DataFrame, geo_res: str):
     """
-    Maps a DataFrame df, which contains data at the county resolution, and
-    aggregate it to the geographic resolution geo_res.
+    Aggregate a county-resolution DataFrame df to the geographic resolution geo_res.
 
     Parameters
     ----------
diff --git a/jhu/delphi_jhu/pull.py b/jhu/delphi_jhu/pull.py
@@ -8,6 +8,8 @@
 
 def download_data(base_url: str, metric: str) -> pd.DataFrame:
     """
+    Download and format JHU data.
+
     Downloads the data from the JHU repo, extracts the UID and the date columns, and
     enforces the date datatype on the the time column.
     """
@@ -24,6 +26,8 @@ def download_data(base_url: str, metric: str) -> pd.DataFrame:
 
 def create_diffs_column(df: pd.DataFrame) -> pd.DataFrame:
     """
+    Compute pairwise differences of cumulative values to get incidence.
+
     Using the cumulative_counts column from the dataframe, partitions the dataframe
     into separate time-series based on fips, and then computes pairwise differences
     of the cumulative values to get the incidence values. Boundary cases are handled
@@ -41,9 +45,7 @@ def create_diffs_column(df: pd.DataFrame) -> pd.DataFrame:
 
 
 def sanity_check_data(df: pd.DataFrame) -> pd.DataFrame:
-    """
-    Perform a final set of sanity checks on the data.
-    """
+    """Perform a final set of sanity checks on the data."""
     days_by_fips = df.groupby("fips").count()["cumulative_counts"].unique()
     unique_days = df["timestamp"].unique()
 
@@ -62,7 +64,7 @@ def sanity_check_data(df: pd.DataFrame) -> pd.DataFrame:
 
 
 def pull_jhu_data(base_url: str, metric: str, gmpr: GeoMapper) -> pd.DataFrame:
-    """Pulls the latest Johns Hopkins CSSE data, and conforms it into a dataset
+    """Pull the latest Johns Hopkins CSSE data and conform it into a dataset.
 
     The output dataset has: