pandas-dev
diff --git a/‎.github/ISSUE_TEMPLATE/documentation_improvement.md
Lines changed: 0 additions & 22 deletions b/‎.github/ISSUE_TEMPLATE/documentation_improvement.md
Lines changed: 0 additions & 22 deletions
diff --git a/‎.github/ISSUE_TEMPLATE/documentation_improvement.yaml
Lines changed: 40 additions & 0 deletions b/‎.github/ISSUE_TEMPLATE/documentation_improvement.yaml
Lines changed: 40 additions & 0 deletions
diff --git a/‎.github/ISSUE_TEMPLATE/submit_question.md
Lines changed: 0 additions & 24 deletions b/‎.github/ISSUE_TEMPLATE/submit_question.md
Lines changed: 0 additions & 24 deletions
diff --git a/‎.github/ISSUE_TEMPLATE/submit_question.yml
Lines changed: 43 additions & 0 deletions b/‎.github/ISSUE_TEMPLATE/submit_question.yml
Lines changed: 43 additions & 0 deletions
diff --git a/‎.github/workflows/asv-bot.yml
Lines changed: 81 additions & 0 deletions b/‎.github/workflows/asv-bot.yml
Lines changed: 81 additions & 0 deletions
diff --git a/‎.github/workflows/autoupdate-pre-commit-config.yml
Lines changed: 1 addition & 1 deletion b/‎.github/workflows/autoupdate-pre-commit-config.yml
Lines changed: 1 addition & 1 deletion
diff --git a/‎.github/workflows/python-dev.yml
Lines changed: 1 addition & 1 deletion b/‎.github/workflows/python-dev.yml
Lines changed: 1 addition & 1 deletion
diff --git a/‎.pre-commit-config.yaml
Lines changed: 5 additions & 0 deletions b/‎.pre-commit-config.yaml
Lines changed: 5 additions & 0 deletions
diff --git a/‎asv_bench/asv.conf.json
Lines changed: 1 addition & 4 deletions b/‎asv_bench/asv.conf.json
Lines changed: 1 addition & 4 deletions
diff --git a/‎asv_bench/benchmarks/dtypes.py
Lines changed: 20 additions & 9 deletions b/‎asv_bench/benchmarks/dtypes.py
Lines changed: 20 additions & 9 deletions
diff --git a/‎asv_bench/benchmarks/frame_ctor.py
Lines changed: 8 additions & 0 deletions b/‎asv_bench/benchmarks/frame_ctor.py
Lines changed: 8 additions & 0 deletions
diff --git a/‎asv_bench/benchmarks/frame_methods.py
Lines changed: 6 additions & 2 deletions b/‎asv_bench/benchmarks/frame_methods.py
Lines changed: 6 additions & 2 deletions
@@ -0,0 +1,40 @@
+name: Documentation Improvement
+description: Report wrong or missing documentation
+title: "DOC: "
+labels: [Docs, Needs Triage]
+
+body:
+  - type: checkboxes
+    attributes:
+      options:
+        - label: >
+            I have checked that the issue still exists on the latest versions of the docs
+            on `master` [here](https://pandas.pydata.org/docs/dev/)
+          required: true
+  - type: textarea
+    id: location
+    attributes:
+      label: Location of the documentation
+      description: >
+        Please provide the location of the documentation, e.g. "pandas.read_csv" or the
+        URL of the documentation, e.g.
+        "https://pandas.pydata.org/docs/reference/api/pandas.read_csv.html"
+      placeholder: https://pandas.pydata.org/docs/reference/api/pandas.read_csv.html
+    validations:
+      required: true
+  - type: textarea
+    id: problem
+    attributes:
+      label: Documentation problem
+      description: >
+        Please provide a description of what documentation you believe needs to be fixed/improved
+    validations:
+      required: true
+  - type: textarea
+    id: suggested-fix
+    attributes:
+      label: Suggested fix for documentation
+      description: >
+        Please explain the suggested fix and **why** it's better than the existing documentation
+    validations:
+      required: true
@@ -0,0 +1,43 @@
+name: Submit Question
+description: Ask a general question about pandas
+title: "QST: "
+labels: [Usage Question, Needs Triage]
+
+body:
+  - type: markdown
+    attributes:
+      value: >
+        Since [StackOverflow](https://stackoverflow.com) is better suited towards answering
+        usage questions, we ask that all usage questions are first asked on StackOverflow.
+  - type: checkboxes
+    attributes:
+      options:
+        - label: >
+            I have searched the [[pandas] tag](https://stackoverflow.com/questions/tagged/pandas)
+            on StackOverflow for similar questions.
+          required: true
+        - label: >
+            I have asked my usage related question on [StackOverflow](https://stackoverflow.com).
+          required: true
+  - type: input
+    id: question-link
+    attributes:
+      label: Link to question on StackOverflow
+    validations:
+      required: true
+  - type: markdown
+    attributes:
+      value: ---
+  - type: textarea
+    id: question
+    attributes:
+      label: Question about pandas
+      description: >
+        **Note**: If you'd still like to submit a question, please read [this guide](
+        https://matthewrocklin.com/blog/work/2018/02/28/minimal-bug-reports) detailing
+        how to provide the necessary information for us to reproduce your question.
+      placeholder: |
+        ```python
+        # Your code here, if applicable
+
+        ```
@@ -0,0 +1,81 @@
+name: "ASV Bot"
+
+on:
+  issue_comment: # Pull requests are issues
+    types:
+      - created
+
+env:
+  ENV_FILE: environment.yml
+  COMMENT: ${{github.event.comment.body}}
+
+jobs:
+  autotune:
+    name: "Run benchmarks"
+    # TODO: Support more benchmarking options later, against different branches, against self, etc
+    if: startsWith(github.event.comment.body, '@github-actions benchmark')
+    runs-on: ubuntu-latest
+    defaults:
+      run:
+        shell: bash -l {0}
+
+    concurrency:
+      # Set concurrency to prevent abuse (full runs take ~5.5 hours!).
+      # Each user can only run one benchmark bot job at a time.
+      # In-progress jobs are not cancelled, so benchmarking multiple PRs means
+      # waiting for the earlier run to finish.
+      group: ${{ github.actor }}-asv
+      cancel-in-progress: false
+
+    steps:
+      - name: Checkout
+        uses: actions/checkout@v2
+        with:
+          fetch-depth: 0
+
+      - name: Cache conda
+        uses: actions/cache@v2
+        with:
+          path: ~/conda_pkgs_dir
+          key: ${{ runner.os }}-conda-${{ hashFiles(env.ENV_FILE) }} # expressions cannot be nested; pass the env context value directly
+
+        # Although asv sets up its own env, deps are still needed
+        # during discovery process
+      - uses: conda-incubator/setup-miniconda@v2
+        with:
+          activate-environment: pandas-dev
+          channel-priority: strict
+          environment-file: ${{ env.ENV_FILE }}
+          use-only-tar-bz2: true
+
+      - name: Run benchmarks
+        id: bench
+        continue-on-error: true # This is a fake failure, asv will exit code 1 for regressions
+        run: |
+          # extract the benchmark regex that follows "-b" in the comment, see https://stackoverflow.com/a/36798723
+          REGEX=$(echo "$COMMENT" | sed -n "s/^.*-b\s*\(\S*\).*$/\1/p")
+          cd asv_bench
+          asv check -E existing
+          git remote add upstream https://github.com/pandas-dev/pandas.git
+          git fetch upstream
+          asv machine --yes
+          asv continuous -f 1.1 -b "$REGEX" upstream/master HEAD  # quoted: user-supplied text must not glob or word-split
+          echo 'BENCH_OUTPUT<<EOF' >> "$GITHUB_ENV"
+          asv compare -f 1.1 upstream/master HEAD >> "$GITHUB_ENV"
+          echo 'EOF' >> "$GITHUB_ENV"
+          echo "REGEX=$REGEX" >> "$GITHUB_ENV"
+
+      - uses: actions/github-script@v4
+        env:
+          BENCH_OUTPUT: ${{env.BENCH_OUTPUT}}
+          REGEX: ${{env.REGEX}}
+        with:
+          script: |
+            const ENV_VARS = process.env
+            const run_url = `https://github.com/${context.repo.owner}/${context.repo.repo}/actions/runs/${context.runId}`
+            await github.issues.createComment({
+              issue_number: context.issue.number,
+              owner: context.repo.owner,
+              repo: context.repo.repo,
+              body: '\nBenchmarks completed. View runner logs here: ' + run_url + '\nRegex used: '+ 'regex ' + ENV_VARS["REGEX"] + '\n' + ENV_VARS["BENCH_OUTPUT"]
+            })
@@ -2,7 +2,7 @@ name: "Update pre-commit config"
 
 on:
   schedule:
-    - cron: "0 7 * * 1" # At 07:00 on each Monday.
+    - cron: "0 7 1 * *" # At 07:00 on 1st of every month.
   workflow_dispatch:
 
 jobs:
 
@@ -41,7 +41,7 @@ jobs:
     - name: Install dependencies
       run: |
         python -m pip install --upgrade pip setuptools wheel
-        pip install git+https://github.com/numpy/numpy.git
+        pip install -i https://pypi.anaconda.org/scipy-wheels-nightly/simple numpy
         pip install git+https://github.com/pytest-dev/pytest.git
         pip install git+https://github.com/nedbat/coveragepy.git
         pip install cython python-dateutil pytz hypothesis pytest-xdist pytest-cov
 
@@ -164,3 +164,8 @@ repos:
         entry: python scripts/no_bool_in_generic.py
         language: python
         files: ^pandas/core/generic\.py$
+    -   id: pandas-errors-documented
+        name: Ensure pandas errors are documented in doc/source/reference/general_utility_functions.rst
+        entry: python scripts/pandas_errors_documented.py
+        language: python
+        files: ^pandas/errors/__init__.py$
@@ -46,17 +46,14 @@
         "numba": [],
         "numexpr": [],
         "pytables": [null, ""],  // platform dependent, see excludes below
+        "pyarrow": [],
         "tables": [null, ""],
         "openpyxl": [],
         "xlsxwriter": [],
         "xlrd": [],
         "xlwt": [],
         "odfpy": [],
-        "pytest": [],
         "jinja2": [],
-        // If using Windows with python 2.7 and want to build using the
-        // mingw toolchain (rather than MSVC), uncomment the following line.
-        // "libpython": [],
     },
     "conda_channels": ["defaults", "conda-forge"],
     // Combinations of libraries/python versions can be excluded/included
 
@@ -50,15 +50,26 @@ def time_pandas_dtype_invalid(self, dtype):
 
 class SelectDtypes:
 
-    params = [
-        tm.ALL_INT_DTYPES
-        + tm.ALL_EA_INT_DTYPES
-        + tm.FLOAT_DTYPES
-        + tm.COMPLEX_DTYPES
-        + tm.DATETIME64_DTYPES
-        + tm.TIMEDELTA64_DTYPES
-        + tm.BOOL_DTYPES
-    ]
+    try:
+        params = [
+            tm.ALL_INT_NUMPY_DTYPES
+            + tm.ALL_INT_EA_DTYPES
+            + tm.FLOAT_NUMPY_DTYPES
+            + tm.COMPLEX_DTYPES
+            + tm.DATETIME64_DTYPES
+            + tm.TIMEDELTA64_DTYPES
+            + tm.BOOL_DTYPES
+        ]
+    except AttributeError:
+        params = [
+            tm.ALL_INT_DTYPES
+            + tm.ALL_EA_INT_DTYPES
+            + tm.FLOAT_DTYPES
+            + tm.COMPLEX_DTYPES
+            + tm.DATETIME64_DTYPES
+            + tm.TIMEDELTA64_DTYPES
+            + tm.BOOL_DTYPES
+        ]
     param_names = ["dtype"]
 
     def setup(self, dtype):
 
@@ -2,6 +2,7 @@
 
 import pandas as pd
 from pandas import (
+    Categorical,
     DataFrame,
     MultiIndex,
     Series,
@@ -31,6 +32,9 @@ def setup(self):
         self.dict_list = frame.to_dict(orient="records")
         self.data2 = {i: {j: float(j) for j in range(100)} for i in range(2000)}
 
+        # arrays which we won't consolidate
+        self.dict_of_categoricals = {i: Categorical(np.arange(N)) for i in range(K)}
+
     def time_list_of_dict(self):
         DataFrame(self.dict_list)
 
@@ -50,6 +54,10 @@ def time_nested_dict_int64(self):
         # nested dict, integer indexes, regression described in #621
         DataFrame(self.data2)
 
+    def time_dict_of_categoricals(self):
+        # dict of arrays that we won't consolidate
+        DataFrame(self.dict_of_categoricals)
+
 
 class FromSeries:
     def setup(self):
 
@@ -542,8 +542,12 @@ class Interpolate:
     def setup(self, downcast):
         N = 10000
         # this is the worst case, where every column has NaNs.
-        self.df = DataFrame(np.random.randn(N, 100))
-        self.df.values[::2] = np.nan
+        arr = np.random.randn(N, 100)
+        # NB: we need to set values in array, not in df.values, otherwise
+        #  the benchmark will be misleading for ArrayManager
+        arr[::2] = np.nan
+
+        self.df = DataFrame(arr)
 
         self.df2 = DataFrame(
             {