diff --git a/raster/r.kappa/calc_kappa.c b/raster/r.kappa/calc_kappa.c
index 431a718954b..ba4d15943c2 100644
--- a/raster/r.kappa/calc_kappa.c
+++ b/raster/r.kappa/calc_kappa.c
@@ -8,6 +8,7 @@
 void calc_kappa(void)
 {
     int i, j;
+    int a_i, b_i;
     int s, l;
     int nl;
     size_t ns;
@@ -37,10 +38,10 @@ void calc_kappa(void)
     total = count_sum(&s, l);
 
     /* calculate the parameters of the kappa-calculation */
-    pi = (double *)G_calloc(ns, sizeof(double));
-    pj = (double *)G_calloc(ns, sizeof(double));
-    pii = (double *)G_calloc(ns, sizeof(double));
-    kpp = (double *)G_calloc(ns, sizeof(double));
+    pi = (double *)G_calloc(ncat, sizeof(double));
+    pj = (double *)G_calloc(ncat, sizeof(double));
+    pii = (double *)G_calloc(ncat, sizeof(double));
+    kpp = (double *)G_calloc(ncat, sizeof(double));
 
     for (i = 0; i < ncat; i++) {
         for (j = 0; j < ns; j++) {
@@ -65,31 +66,46 @@ void calc_kappa(void)
         pC += pi[i] * pj[i];
     }
 
-    for (i = 0; i < ncat; i++)
-        if ((pi[i] == 0) || (pj[i] == 0))
+    for (i = 0; i < ncat; i++) {
+        if (pi[i] == 0)
             kpp[i] = -999;
         else
             kpp[i] = (pii[i] - pi[i] * pj[i]) / (pi[i] - pi[i] * pj[i]);
+    }
 
     /* print out the comission and omission accuracy, and conditional kappa */
     fprintf(fd, "\nCats\t%% Comission\t%% Omission\tEstimated Kappa\n");
-    for (i = 0; i < ncat; i++)
-        if ((kpp[i] == -999) && (i != 0))
-            fprintf(fd, "%ld\tNA\t\tNA\t\tNA\n", rlst[i]);
+    for (i = 0; i < ncat; i++) {
+        fprintf(fd, "%ld\t", rlst[i]);
+        if (pi[i] == 0)
+            fprintf(fd, "NA\t\t");
+        else
+            fprintf(fd, "%f\t", 100 * (1 - pii[i] / pi[i]));
+        if (pj[i] == 0)
+            fprintf(fd, "NA\t\t");
         else
-            fprintf(fd, "%ld\t%f\t%f\t%f\n",
-                    rlst[i], 100 * (1 - pii[i] / pi[i]),
-                    100 * (1 - pii[i] / pj[i]), kpp[i]);
+            fprintf(fd, "%f\t", 100 * (1 - pii[i] / pj[i]));
+        if (kpp[i] == -999)
+            fprintf(fd, "NA\n");
+        else
+            fprintf(fd, "%f\n", kpp[i]);
+    }
     fprintf(fd, "\n");
 
     for (i = 0; i < ncat; i++) {
         inter1 += pii[i] * pow(((1 - pC) - (1 - p0) * (pi[i] + pj[i])), 2.);
     }
+
     for (j = 0; j < ns; j++) {
-        if (Gstats[j].cats[0] != Gstats[j].cats[1])
-            inter2 += Gstats[j].count *
-                pow((pi[Gstats[j].cats[0] - 1] + pj[Gstats[j].cats[1] - 1]),
-                    2.) / total;
+        if (Gstats[j].cats[0] != Gstats[j].cats[1]) {
+            for (i = 0; i < ncat; i++) {
+                if (Gstats[j].cats[0] == rlst[i])
+                    a_i = i;
+                if (Gstats[j].cats[1] == rlst[i])
+                    b_i = i;
+            }
+            inter2 += Gstats[j].count * pow((pi[a_i] + pj[b_i]), 2.) / total;
+        }
     }
     kp = (p0 - pC) / (1 - pC);
     vkp = (inter1 + pow((1 - p0), 2.) * inter2 -
diff --git a/raster/r.kappa/prt2csv_mat.c b/raster/r.kappa/prt2csv_mat.c
index f870f8a1617..0ac370fc581 100644
--- a/raster/r.kappa/prt2csv_mat.c
+++ b/raster/r.kappa/prt2csv_mat.c
@@ -97,8 +97,9 @@ void prn2csv_error_mat(int out_cols, int hdr)
             if (cl)
                 G_strip(cl);
             if (cl == NULL || *cl == 0)
-                cl = "NULL";
-            fprintf(fd, "%s\t", cl);
+                fprintf(fd, "%ld\t", cats[j]);
+            else
+                fprintf(fd, "%s\t", cl);
         }
         /*for (cndx = first_col; cndx < last_col; cndx++) */
         /*    fprintf(fd, "%ld\t", rlst[cndx]); */
@@ -112,8 +113,9 @@ void prn2csv_error_mat(int out_cols, int hdr)
             if (cl)
                 G_strip(cl);
             if (cl == NULL || *cl == 0)
-                cl = "NULL";
-            fprintf(fd, "%s\t", cl);
+                fprintf(fd, "%ld\t", cats[rndx]);
+            else
+                fprintf(fd, "%s\t", cl);
             /* entries */
             for (cndx = first_col; cndx < last_col; cndx++) {
                 thisone = (ncat * rndx) + cndx;
diff --git a/raster/r.kappa/testsuite/data/class_1.ascii b/raster/r.kappa/testsuite/data/class_1.ascii
new file mode 100644
index 00000000000..b548d1d634d
--- /dev/null
+++ b/raster/r.kappa/testsuite/data/class_1.ascii
@@ -0,0 +1,14 @@
+north:  5
+south:  0
+east:   5
+west:   0
+rows:   5
+cols:   5
+null:   n
+type:   int
+
+1 n 3 3 4
+5 3 1 4 n
+n 1 3 6 6
+6 n 6 1 3
+4 4 4 4 3
diff --git a/raster/r.kappa/testsuite/data/class_2.ascii b/raster/r.kappa/testsuite/data/class_2.ascii
new file mode 100644
index 00000000000..15b47aedbc8
--- /dev/null
+++ b/raster/r.kappa/testsuite/data/class_2.ascii
@@ -0,0 +1,14 @@
+north:  5
+south:  0
+east:   5
+west:   0
+rows:   5
+cols:   5
+null:   n
+type:   int
+
+9 9 9 9 9
+9 9 9 9 9
+9 9 9 9 9
+9 9 9 9 9
+9 9 9 9 9
diff --git a/raster/r.kappa/testsuite/data/ref_1.ascii b/raster/r.kappa/testsuite/data/ref_1.ascii
new file mode 100644
index 00000000000..320571cbe1f
--- /dev/null
+++ b/raster/r.kappa/testsuite/data/ref_1.ascii
@@ -0,0 +1,14 @@
+north:  5
+south:  0
+east:   5
+west:   0
+rows:   5
+cols:   5
+null:   n
+type:   int
+
+1 3 n 3 6
+5 3 1 n n
+n 1 2 2 2
+6 n 6 1 3
+1 1 1 n 3
diff --git a/raster/r.kappa/testsuite/data/ref_2.ascii b/raster/r.kappa/testsuite/data/ref_2.ascii
new file mode 100644
index 00000000000..eceb8ac4a5d
--- /dev/null
+++ b/raster/r.kappa/testsuite/data/ref_2.ascii
@@ -0,0 +1,14 @@
+north:  5
+south:  0
+east:   5
+west:   0
+rows:   5
+cols:   5
+null:   n
+type:   int
+
+0 1 2 1 0
+1 2 3 2 1
+2 3 4 3 2
+1 2 3 2 1
+0 1 2 1 0
diff --git a/raster/r.kappa/testsuite/test_r_kappa.py b/raster/r.kappa/testsuite/test_r_kappa.py
new file mode 100644
index 00000000000..fc85a3c1a4e
--- /dev/null
+++ b/raster/r.kappa/testsuite/test_r_kappa.py
@@ -0,0 +1,296 @@
+"""
+Name:      r.kappa tests
+Purpose:   Validates accuracy calculations and output
+
+Author:    Maris Nartiss
+Copyright: (C) 2022 by Maris Nartiss and the GRASS Development Team
+Licence:   This program is free software under the GNU General Public
+           License (>=v2). Read the file COPYING that comes with GRASS
+           for details.
+"""
+
+import os
+import pathlib
+
+from grass.script import read_command
+from grass.script.core import tempname
+from grass.gunittest.case import TestCase
+from grass.gunittest.main import test
+
+
+class MatrixCorrectnessTest(TestCase):
+    """Test correctness of calculated matrix"""
+
+    @classmethod
+    def setUpClass(cls):
+        """Import sample maps with known properties"""
+        cls.use_temp_region()
+        cls.runModule("g.region", n=5, s=0, e=5, w=0, res=1)
+
+        cls.data_dir = os.path.join(pathlib.Path(__file__).parent.absolute(), "data")
+        cls.ref_1 = tempname(10)
+        cls.runModule(
+            "r.in.ascii",
+            input=os.path.join(cls.data_dir, "ref_1.ascii"),
+            output=cls.ref_1,
+            quiet=True,
+        )
+        cls.class_1 = tempname(10)
+        cls.runModule(
+            "r.in.ascii",
+            input=os.path.join(cls.data_dir, "class_1.ascii"),
+            output=cls.class_1,
+            quiet=True,
+        )
+
+    @classmethod
+    def tearDownClass(cls):
+        """Remove temporary data"""
+        cls.del_temp_region()
+        cls.runModule("g.remove", flags="f", type="raster", name=cls.ref_1)
+        cls.runModule("g.remove", flags="f", type="raster", name=cls.class_1)
+
+    def test_m(self):
+        """Test printing matrix only
+        Implicitly tests calculation of matrix
+        """
+
+        ref = """cat#\t1\t2\t3\t4\t5\t6\tRowSum
+1\t4\t0\t0\t0\t0\t0\t4
+2\t0\t0\t0\t0\t0\t0\t0
+3\t0\t1\t4\t0\t0\t0\t5
+4\t3\t0\t0\t0\t0\t1\t4
+5\t0\t0\t0\t0\t1\t0\t1
+6\t0\t2\t0\t0\t0\t2\t4
+ColSum\t7\t3\t4\t0\t1\t3\t18
+
+"""
+        out = read_command(
+            "r.kappa",
+            reference=self.ref_1,
+            classification=self.class_1,
+            flags="m",
+            quiet=True,
+        )
+        self.assertEqual(out, ref)
+
+
+class CalculationCorrectness1Test(TestCase):
+    """Test correctness of values in printout mode
+    First version of reference data"""
+
+    @classmethod
+    def setUpClass(cls):
+        """Import sample maps with known properties"""
+        cls.use_temp_region()
+        cls.runModule("g.region", n=5, s=0, e=5, w=0, res=1)
+
+        cls.data_dir = os.path.join(pathlib.Path(__file__).parent.absolute(), "data")
+        cls.ref_1 = tempname(10)
+        cls.runModule(
+            "r.in.ascii",
+            input=os.path.join(cls.data_dir, "ref_1.ascii"),
+            output=cls.ref_1,
+            quiet=True,
+        )
+        cls.class_1 = tempname(10)
+        cls.runModule(
+            "r.in.ascii",
+            input=os.path.join(cls.data_dir, "class_1.ascii"),
+            output=cls.class_1,
+            quiet=True,
+        )
+        cls.per_class = {
+            "producer": [
+                100 - 57.143,
+                100 - 0.0,
+                100 - 100.0,
+                "NA",
+                100 - 100.0,
+                100 - 66.666,
+            ],
+            "user": [100 - 100.0, "NA", 100 - 80.0, 100 - 0.0, 100 - 100.0, 100 - 50.0],
+            "cond.kappa": [1.0, "NA", 0.743, 0.0, 1.0, 0.4],
+        }
+
+    @classmethod
+    def tearDownClass(cls):
+        """Remove temporary data"""
+        cls.del_temp_region()
+        cls.runModule("g.remove", flags="f", type="raster", name=cls.ref_1)
+        cls.runModule("g.remove", flags="f", type="raster", name=cls.class_1)
+
+    def match(self, pat, ref):
+        if pat == "NA" or ref == "NA":
+            return pat == ref
+        try:
+            val = float(pat)
+        except ValueError:
+            return False
+        return ref - val < 0.001
+
+    # Characteristics of the matrix
+    # All values were obtained according to formulas given in
+    # Rossiter 2004. Technical Note: Statistical methods for accuracy
+    # assessment of classified thematic maps.
+    # Only exception is Kappa variance as attempts to follow formulas given
+    # by Rossiter lead to a spectacular failure (most likely due to
+    # poor math skills of the author of this testing code). Thus Kappa
+    # variance is not validated as "good" value is not known.
+    # Overall Cohen Kappa value: 0.52091
+    # Observation count: 18
+    # Correct count: 11
+    # Overall accuracy: 0.61111
+    # CAT TP TN FP FN Prod  User  pii   pi+   p+i   conditional kappa
+    # 1   4  11 0  3  0.571 1.000 0.222 0.222 0.389 1.000
+    # 2   0  15 0  3  0.000 -     0.000 0.000 0.167 -
+    # 3   4  13 1  0  1.000 0.800 0.222 0.278 0.222 0.743
+    # 4   0  14 4  0  -     0.000 0.000 0.222 0.000 0.000
+    # 5   1  17 0  0  1.000 1.000 0.056 0.056 0.056 1.000
+    # 6   2  13 2  1  0.667 0.500 0.111 0.222 0.167 0.400
+
+    def test_standard_output(self):
+        out = read_command(
+            "r.kappa",
+            reference=self.ref_1,
+            classification=self.class_1,
+            flags="w",
+            quiet=True,
+        )
+        rows = out.splitlines()
+
+        # Matrix part
+        self.assertEqual(rows[10], " M     1\t4\t0\t0\t0\t0\t0\t4")
+        self.assertEqual(rows[11], " A     2\t0\t0\t0\t0\t0\t0\t0")
+        self.assertEqual(rows[12], " P     3\t0\t1\t4\t0\t0\t0\t5")
+        self.assertEqual(rows[13], " 2     4\t3\t0\t0\t0\t0\t1\t4")
+        self.assertEqual(rows[14], "       5\t0\t0\t0\t0\t1\t0\t1")
+        self.assertEqual(rows[15], "       6\t0\t2\t0\t0\t0\t2\t4")
+        self.assertEqual(rows[16], "Col Sum\t\t7\t3\t4\t0\t1\t3\t18")
+
+        # Per class coefficients
+        for c in range(len(self.per_class["producer"])):
+            vals = rows[20 + c].split()
+            # The test on the next line is valid only for this data
+            self.assertEqual(vals[0], str(c + 1))
+            self.assertTrue(self.match(vals[1], self.per_class["user"][c]))
+            self.assertTrue(self.match(vals[2], self.per_class["producer"][c]))
+            self.assertTrue(self.match(vals[3], self.per_class["cond.kappa"][c]))
+
+        # Kappa value
+        vals = rows[28].split()
+        self.assertTrue(self.match(vals[0], 0.52091))
+
+        # Overall characteristics
+        vals = rows[31].split()
+        self.assertEqual(vals[0], "11")
+        self.assertEqual(vals[1], "18")
+        self.assertTrue(self.match(vals[2], 61.111))
+
+
+class CalculationCorrectness2Test(TestCase):
+    """Test correctness of values in printout mode
+    A pathological case when no values match"""
+
+    @classmethod
+    def setUpClass(cls):
+        """Import sample maps with known properties"""
+        cls.use_temp_region()
+        cls.runModule("g.region", n=5, s=0, e=5, w=0, res=1)
+
+        cls.data_dir = os.path.join(pathlib.Path(__file__).parent.absolute(), "data")
+        cls.ref_1 = tempname(10)
+        cls.runModule(
+            "r.in.ascii",
+            input=os.path.join(cls.data_dir, "ref_2.ascii"),
+            output=cls.ref_1,
+            quiet=True,
+        )
+        cls.class_1 = tempname(10)
+        cls.runModule(
+            "r.in.ascii",
+            input=os.path.join(cls.data_dir, "class_2.ascii"),
+            output=cls.class_1,
+            quiet=True,
+        )
+        cls.per_class = {
+            "producer": [
+                100.0,
+                100.0,
+                100.0,
+                100.0,
+                100.0,
+                "NA",
+            ],
+            "user": ["NA", "NA", "NA", "NA", "NA", 100.0],
+            "cond.kappa": ["NA", "NA", "NA", "NA", "NA", 0.0],
+        }
+
+    @classmethod
+    def tearDownClass(cls):
+        """Remove temporary data"""
+        cls.del_temp_region()
+        # cls.runModule("g.remove", flags="f", type="raster", name=cls.ref_1)
+        # cls.runModule("g.remove", flags="f", type="raster", name=cls.class_1)
+
+    def match(self, pat, ref):
+        if pat == "NA" or ref == "NA":
+            return pat == ref
+        try:
+            val = float(pat)
+        except ValueError:
+            return False
+        return ref - val < 0.001
+
+    # Characteristics of the matrix
+    # Overall Cohen Kappa value: 0.0
+    # Observation count: 25
+    # Correct count: 0
+    # Overall accuracy: 0.0
+    # CAT TP  TN  FP  FN  User Producer
+    # 0   0   17  0   8   -    0
+    # 1   0   17  0   8   -    0
+    # 2   0   21  0   4   -    0
+    # 3   0   24  0   1   -    0
+    # 4   0   21  0   4   -    0
+    # 9   0   0   25  0   0    -
+
+    def test_standard_output(self):
+        out = read_command(
+            "r.kappa",
+            reference=self.ref_1,
+            classification=self.class_1,
+            flags="w",
+            quiet=True,
+        )
+        rows = out.splitlines()
+
+        # Matrix part
+        self.assertEqual(rows[10], " M     0\t0\t0\t0\t0\t0\t0\t0")
+        self.assertEqual(rows[11], " A     1\t0\t0\t0\t0\t0\t0\t0")
+        self.assertEqual(rows[12], " P     2\t0\t0\t0\t0\t0\t0\t0")
+        self.assertEqual(rows[13], " 2     3\t0\t0\t0\t0\t0\t0\t0")
+        self.assertEqual(rows[14], "       4\t0\t0\t0\t0\t0\t0\t0")
+        self.assertEqual(rows[15], "       9\t4\t8\t8\t4\t1\t0\t25")
+        self.assertEqual(rows[16], "Col Sum\t\t4\t8\t8\t4\t1\t0\t25")
+
+        # Per class coefficients
+        for c in range(len(self.per_class["producer"])):
+            vals = rows[20 + c].split()
+            self.assertTrue(self.match(vals[1], self.per_class["user"][c]))
+            self.assertTrue(self.match(vals[2], self.per_class["producer"][c]))
+            self.assertTrue(self.match(vals[3], self.per_class["cond.kappa"][c]))
+
+        # Kappa value
+        vals = rows[28].split()
+        self.assertTrue(self.match(vals[0], 0.0))
+
+        # Overall characteristics
+        vals = rows[31].split()
+        self.assertEqual(vals[0], "0")
+        self.assertEqual(vals[1], "25")
+        self.assertTrue(self.match(vals[2], 0.0))
+
+
+if __name__ == "__main__":
+    test()