diff --git a/.buildinfo b/.buildinfo
index 77ce9891..29220e7c 100644
--- a/.buildinfo
+++ b/.buildinfo
@@ -1,4 +1,4 @@
 # Sphinx build info version 1
 # This file hashes the configuration used when building these files. When it is not found, a full rebuild will be done.
-config: 8eb14ef0987ca17d9dfbb8af61480095
+config: 5d67110e4b7f3308f48f9b0005f1974e
 tags: 645f666f9bcd5a90fca523b33c5a78b7
diff --git a/.doctrees/environment.pickle b/.doctrees/environment.pickle
index 0ea6ce80..76a594ae 100644
Binary files a/.doctrees/environment.pickle and b/.doctrees/environment.pickle differ
diff --git a/.doctrees/index.doctree b/.doctrees/index.doctree
index 67805054..05761b6c 100644
Binary files a/.doctrees/index.doctree and b/.doctrees/index.doctree differ
diff --git a/.doctrees/spark_usage.doctree b/.doctrees/spark_usage.doctree
index 9d890dc8..04e52361 100644
Binary files a/.doctrees/spark_usage.doctree and b/.doctrees/spark_usage.doctree differ
diff --git a/_sources/spark_usage.rst.txt b/_sources/spark_usage.rst.txt
index e064f0fb..7bd942cd 100644
--- a/_sources/spark_usage.rst.txt
+++ b/_sources/spark_usage.rst.txt
@@ -3,15 +3,15 @@ Spark Usage
 
 .. important::
 
-    With version ``v0.12.0`` the original ``SparkCompare`` was replaced with a
-    Pandas on Spark implementation The original ``SparkCompare``
-    implementation differs from all the other native implementations. To align the API better,
-    and keep behaviour consistent we are deprecating the original ``SparkCompare``
+    With version ``v0.12.0`` the original ``SparkCompare`` was replaced with a
+    Pandas on Spark implementation. The original ``SparkCompare``
+    implementation differs from all the other native implementations. To align the API better
+    and keep behaviour consistent, we are deprecating the original ``SparkCompare``
     into a new module ``LegacySparkCompare``
 
     Subsequently in ``v0.13.0`` a PySpark DataFrame class has been introduced (``SparkSQLCompare``)
-    which accepts ``pyspark.sql.DataFrame`` and should provide better performance. With this version
-    the Pandas on Spark implementation has been renamed to ``SparkPandasCompare`` and all the spark
+    which accepts ``pyspark.sql.DataFrame`` and should provide better performance. With this version
+    the Pandas on Spark implementation has been renamed to ``SparkPandasCompare`` and all the Spark
     logic is now under the ``spark`` submodule.
 
 If you wish to use the old SparkCompare moving forward you can import it like so:
@@ -19,29 +19,24 @@ Spark Usage
 
 .. code-block:: python
 
     from datacompy.spark.legacy import LegacySparkCompare
-
-For both ``SparkSQLCompare`` and ``SparkPandasCompare``
-
-- ``on_index`` is not supported.
-- Joining is done using ``<=>`` which is the equality test that is safe for null values.
-- ``SparkPandasCompare`` compares ``pyspark.pandas.DataFrame``'s
-- ``SparkSQLCompare`` compares ``pyspark.sql.DataFrame``'s
-
-Supported Version
------------------
 
 .. important::
 
-    Spark will not offically support Pandas 2 until Spark 4: https://issues.apache.org/jira/browse/SPARK-44101
+    Starting with ``v0.14.1``, ``SparkPandasCompare`` is slated for deprecation. ``SparkSQLCompare``
+    is the preferred implementation and is much more performant. Note that if you continue to use
+    ``SparkPandasCompare``, ``numpy`` 2+ is not supported due to dependency issues.
+
+For ``SparkSQLCompare``:
 
-Until then we will not be supporting Pandas 2 for the Pandas on Spark API implementaion.
-For Fugue, the Native Pandas (`Compare`), and `SparkSQLCompare` implementations, Pandas 2 is supported.
+- ``on_index`` is not supported.
+- Joining is done using ``<=>``, the null-safe equality test.
+- ``SparkSQLCompare`` compares ``pyspark.sql.DataFrame`` objects.
 
-SparkPandasCompare and SparkSQLCompare Object Setup
----------------------------------------------------
+SparkSQLCompare
+---------------
 
 There is currently only one supported method for joining your dataframes - by
 join column(s).
@@ -52,7 +47,7 @@ join column(s).
 
     from io import StringIO
    import pandas as pd
    import pyspark.pandas as ps
-    from datacompy import SparkPandasCompare, SparkSQLCompare
+    from datacompy import SparkSQLCompare
     from pyspark.sql import SparkSession
 
     spark = SparkSession.builder.getOrCreate()
@@ -73,25 +68,6 @@ join column(s).
     10000001238,1.05,Loose Seal Bluth,111
     """
 
-    # SparkPandasCompare
-    df1 = ps.from_pandas(pd.read_csv(StringIO(data1)))
-    df2 = ps.from_pandas(pd.read_csv(StringIO(data2)))
-
-    compare = SparkPandasCompare(
-        df1,
-        df2,
-        join_columns='acct_id',  # You can also specify a list of columns
-        abs_tol=0,  # Optional, defaults to 0
-        rel_tol=0,  # Optional, defaults to 0
-        df1_name='Original',  # Optional, defaults to 'df1'
-        df2_name='New'  # Optional, defaults to 'df2'
-    )
-    compare.matches(ignore_extra_columns=False)
-    # False
-    # This method prints out a human-readable report summarizing and sampling differences
-    print(compare.report())
-
-    # SparkSQLCompare
     df1 = spark.createDataFrame(pd.read_csv(StringIO(data1)))
     df2 = spark.createDataFrame(pd.read_csv(StringIO(data2)))
diff --git a/_static/documentation_options.js b/_static/documentation_options.js
index 9242cb85..5c726b82 100644
--- a/_static/documentation_options.js
+++ b/_static/documentation_options.js
@@ -1,5 +1,5 @@
 const DOCUMENTATION_OPTIONS = {
-    VERSION: '0.14.0',
+    VERSION: '0.14.1',
     LANGUAGE: 'en',
     COLLAPSE_INDEX: false,
     BUILDER: 'html',
diff --git a/api/datacompy.html b/api/datacompy.html
index dfe06df6..0a34a8da 100644
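
The hunks above stop where the docs build ``df1`` and ``df2``; the comparison step itself falls outside the changed lines. For reference, here is a minimal sketch of the full ``SparkSQLCompare`` flow the updated page documents. It assumes the constructor takes the active ``SparkSession`` as its first argument (per the ``v0.13`` API) and otherwise mirrors the keyword arguments shown in the removed ``SparkPandasCompare`` example — a sketch, not the canonical docs.

.. code-block:: python

    import pandas as pd
    from datacompy import SparkSQLCompare
    from pyspark.sql import SparkSession

    spark = SparkSession.builder.getOrCreate()

    # Two small frames keyed on acct_id that differ in one value
    df1 = spark.createDataFrame(pd.DataFrame({"acct_id": [1, 2], "dollar_amt": [123.45, 0.45]}))
    df2 = spark.createDataFrame(pd.DataFrame({"acct_id": [1, 2], "dollar_amt": [123.40, 0.45]}))

    compare = SparkSQLCompare(
        spark,                   # active SparkSession (assumed first argument)
        df1,
        df2,
        join_columns="acct_id",  # a single column name or a list of columns
        abs_tol=0,               # optional, defaults to 0
        rel_tol=0,               # optional, defaults to 0
        df1_name="Original",     # optional, defaults to 'df1'
        df2_name="New",          # optional, defaults to 'df2'
    )
    compare.matches(ignore_extra_columns=False)  # False: dollar_amt differs for acct_id 1
    print(compare.report())  # human-readable summary with samples of the differences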
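
The bullet list in the new text notes that joins use ``<=>``, Spark's null-safe equality. Below is a short, standalone PySpark illustration of why that matters; ``eqNullSafe`` is the DataFrame-API spelling of ``<=>``, and the column name ``k`` is purely for the example.

.. code-block:: python

    from pyspark.sql import Row, SparkSession

    spark = SparkSession.builder.getOrCreate()

    left = spark.createDataFrame([Row(k=1), Row(k=None)])
    right = spark.createDataFrame([Row(k=1), Row(k=None)])

    # Plain equality: NULL = NULL evaluates to NULL, so null keys never match
    left.join(right, left["k"] == right["k"]).count()            # 1

    # Null-safe equality: NULL <=> NULL is true, so null keys do match
    left.join(right, left["k"].eqNullSafe(right["k"])).count()   # 2

Because datacompy joins with ``<=>``, rows whose join keys are null on both sides line up with each other instead of silently dropping out of the comparison.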