danforthcenter · afinit · Jul 8, 2023 · Jul 8, 2023 · Jul 8, 2023 · Jul 11, 2023
diff --git a/docs/jupyter.md b/docs/jupyter.md
@@ -132,7 +132,7 @@ img, imgpath, imgname = pcv.readimage(filename=args.image)
 # Jupyter here
 
 # Print data that gets collected into the Outputs 
-pcv.outputs.save_results(filename=args.result, outformat="json")
+pcv.outputs.save_results(filename=args.result, outformat="json", append=True)
 
 ```
 

diff --git a/docs/outputs.md b/docs/outputs.md
@@ -68,12 +68,15 @@ Methods are accessed as plantcv.outputs.*method*.
 
 * label:  The label for each value, which will be useful when the data is a frequency table (e.g. hues). 
 
-**save_results**(*filename, outformat="json"*): Save results to a file
+**save_results**(*filename, outformat="json", append=True*): Save results to a file
 
 * filename: Path and name of the output file
 
 * outformat: Output file format (default = "json"). Supports "json" and "csv" formats
 
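+* append: When true, **save_results** will append to an existing file. In a json file, the new observations are merged into the existing ones, and any sample that is already in the file is replaced by the new data for that sample.
+In a csv file, the new rows are added after the existing rows without repeating the header, so the same sample can appear more than once. When this is false, **save_results** will overwrite an existing file.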
+
 **Example use:**
     - [Use In VIS/NIR Tutorial](tutorials/vis_nir_tutorial.md)
 
@@ -91,7 +94,7 @@ shape_img = pcv.analyze.size(img=img, labeled_mask=mask, n_labels=1, label="defa
 plant_area = pcv.outputs.observations['default1']['pixel_area']['value']
 
 # Write shape data to results file
-pcv.outputs.save_results(filename=args.result, outformat="json")
+pcv.outputs.save_results(filename=args.result, outformat="json", append=True)
 
 # Will will print out results again, so clear the outputs before running NIR analysis 
 pcv.outputs.clear()
@@ -102,7 +105,7 @@ nir_hist = pcv.analyze.grayscale(gray_img=nir2, labeled_mask=nir_combinedmask, n
 shape_img = pcv.analyze.size(img=nir2, labeled_mask=nir_combinedmask, n_labels=1, label="default")
 
 # Write the NIR and shape data to a file 
-pcv.outputs.save_results(filename=args.coresult, outformat="json")
+pcv.outputs.save_results(filename=args.coresult, outformat="json", append=True)
 
 ```
 
@@ -125,7 +128,7 @@ pcv.outputs.add_observation(sample='default', variable='percent_diseased',
                             value=percent_diseased, label='percent')
 
 # Write custom data to results file
-pcv.outputs.save_results(filename=args.result, outformat="json")
+pcv.outputs.save_results(filename=args.result, outformat="json", append=True)
 
 ```
 

diff --git a/docs/updating.md b/docs/updating.md
@@ -688,6 +688,7 @@ pages for more details on the input and output variable types.
 
 * pre v3.12: NA
 * post v3.12: **plantcv.outputs.save_results**(*filename, outformat="json"*)
+* post v4.0: **plantcv.outputs.save_results**(*filename, outformat="json", append=True*)
 
 #### plantcv.photosynthesis.analyze_fvfm
 

diff --git a/plantcv/plantcv/classes.py b/plantcv/plantcv/classes.py
@@ -128,7 +128,7 @@ def add_observation(self, sample, variable, trait, method, scale, datatype, valu
         }
 
     # Method to save observations to a file
-    def save_results(self, filename, outformat="json"):
+    def save_results(self, filename, outformat="json", append=True):
         """Save results to a file.
 
         Keyword arguments/parameters:
@@ -142,48 +142,59 @@ def save_results(self, filename, outformat="json"):
             if os.path.isfile(filename):
                 with open(filename, 'r') as f:
                     hierarchical_data = json.load(f)
-                    hierarchical_data["observations"] = self.observations
+                    if append:
+                        observations = hierarchical_data["observations"] | self.observations
+                    else:
+                        observations = self.observations
+
+                    hierarchical_data["observations"] = observations
             else:
                 hierarchical_data = {"metadata": {}, "observations": self.observations}
 
             with open(filename, mode='w') as f:
                 json.dump(hierarchical_data, f)
         elif outformat.upper() == "CSV":
+            if append and os.path.isfile(filename):
+                mode = "a"
+            else:
+                mode = "w"
             # Open output CSV file
-            csv_table = open(filename, "w")
-            # Write the header
-            csv_table.write(",".join(map(str, ["sample", "trait", "value", "label"])) + "\n")
-            # Iterate over data samples
-            for sample in self.observations:
-                # Iterate over traits for each sample
-                for var in self.observations[sample]:
-                    val = self.observations[sample][var]["value"]
-                    # If the data type is a list or tuple we need to unpack the data
-                    if isinstance(val, (list, tuple)):
-                        # Combine each value with its label
-                        for value, label in zip(self.observations[sample][var]["value"],
-                                                self.observations[sample][var]["label"]):
-                            # Skip list of tuple data types
-                            if not isinstance(value, tuple):
-                                # Save one row per value-label
-                                row = [sample, var, value, label]
-                                csv_table.write(",".join(map(str, row)) + "\n")
-                    # If the data type is Boolean, store as a numeric 1/0 instead of True/False
-                    elif isinstance(val, bool):
-                        row = [sample,
-                               var,
-                               int(self.observations[sample][var]["value"]),
-                               self.observations[sample][var]["label"]]
-                        csv_table.write(",".join(map(str, row)) + "\n")
-                    # For all other supported data types, save one row per trait
-                    # Assumes no unusual data types are present (possibly a bad assumption)
-                    else:
-                        row = [sample,
-                               var,
-                               self.observations[sample][var]["value"],
-                               self.observations[sample][var]["label"]
-                               ]
-                        csv_table.write(",".join(map(str, row)) + "\n")
+            with open(filename, mode) as csv_table:
+                # Write the header if not appending
+                if mode == "w":
+                    csv_table.write(",".join(map(str, ["sample", "trait", "value", "label"])) + "\n")
+
+                # Iterate over data samples
+                for sample in self.observations:
+                    # Iterate over traits for each sample
+                    for var in self.observations[sample]:
+                        val = self.observations[sample][var]["value"]
+                        # If the data type is a list or tuple we need to unpack the data
+                        if isinstance(val, (list, tuple)):
+                            # Combine each value with its label
+                            for value, label in zip(self.observations[sample][var]["value"],
+                                                    self.observations[sample][var]["label"]):
+                                # Skip list of tuple data types
+                                if not isinstance(value, tuple):
+                                    # Save one row per value-label
+                                    row = [sample, var, value, label]
+                                    csv_table.write(",".join(map(str, row)) + "\n")
+                        else:
+                            # If the data type is Boolean, store as a numeric 1/0 instead of True/False
+                            if isinstance(val, bool):
+                                outputValue = int(val)
+                            # For all other supported data types, save one row per trait
+                            # Assumes no unusual data types are present (possibly a bad assumption)
+                            else:
+                                outputValue = val
+
+                            row = [sample,
+                                   var,
+                                   outputValue,
+                                   self.observations[sample][var]["label"]]
+                            csv_table.write(",".join(map(str, row)) + "\n")
+        else:
+            raise ValueError("outformat must be one of (case insensitive): ['json', 'csv']")
 
     def plot_dists(self, variable):
         """Plot a distribution of data.

diff --git a/tests/plantcv/test_outputs.py b/tests/plantcv/test_outputs.py
@@ -35,11 +35,24 @@ def test_save_results_json_newfile(tmpdir):
     outputs = Outputs()
     outputs.add_observation(sample='default', variable='test', trait='test variable', method='test', scale='none',
                             datatype=str, value="test", label="none")
-    outputs.save_results(filename=outfile, outformat="json")
+    outputs.save_results(filename=outfile, outformat="json", append=False)
     with open(outfile, "r") as fp:
         results = json.load(fp)
         assert results["observations"]["default"]["test"]["value"] == "test"
 
+def test_save_results_json_newfile_append(tmpdir):
+    """Test for PlantCV."""
+    # Create a test tmp directory
+    cache_dir = tmpdir.mkdir("cache")
+    outfile = os.path.join(cache_dir, "results.json")
+    # Create output instance
+    outputs = Outputs()
+    outputs.add_observation(sample='default', variable='test', trait='test variable', method='test', scale='none',
+                            datatype=str, value="test", label="none")
+    outputs.save_results(filename=outfile, outformat="json", append=True)
+    with open(outfile, "r") as fp:
+        results = json.load(fp)
+        assert results["observations"]["default"]["test"]["value"] == "test"
 
 def test_save_results_json_existing_file(test_data, tmpdir):
     """Test for PlantCV."""
@@ -51,11 +64,34 @@ def test_save_results_json_existing_file(test_data, tmpdir):
     outputs = Outputs()
     outputs.add_observation(sample='default', variable='test', trait='test variable', method='test', scale='none',
                             datatype=str, value="test", label="none")
-    outputs.save_results(filename=outfile, outformat="json")
+    outputs.save_results(filename=outfile, outformat="json", append=False)
     with open(outfile, "r") as fp:
         results = json.load(fp)
         assert results["observations"]["default"]["test"]["value"] == "test"
 
+def test_save_results_json_existing_file_append(test_data, tmpdir):
+    """Test for PlantCV."""
+    # Create a test tmp directory
+    cache_dir = tmpdir.mkdir("cache")
+    outfile = os.path.join(cache_dir, os.path.basename(test_data.outputs_results_json))
+    copyfile(test_data.outputs_results_json, outfile)
+    # Create output instance
+    outputs = Outputs()
+    outputs.add_observation(sample='default', variable='test', trait='test variable', method='test', scale='none',
+                            datatype=str, value="test", label="none")
+    outputs.save_results(filename=outfile, outformat="json", append=True)
+
+    outputs2 = Outputs()
+    outputs2.add_observation(sample='default', variable='test', trait='test variable', method='test', scale='none',
+                            datatype=str, value="this data overwrites the original value for this", label="none")
+    outputs2.add_observation(sample='newdatas', variable='test', trait='test variable', method='test', scale='none',
+                            datatype=str, value="some data here", label="none")
+    outputs2.save_results(filename=outfile, outformat="json", append=True)
+
+    with open(outfile, "r") as fp:
+        results = json.load(fp)
+        assert results["observations"]["default"]["test"]["value"] == "this data overwrites the original value for this"
+        assert results["observations"]["newdatas"]["test"]["value"] == "some data here"
 
 def test_save_results_csv(test_data, tmpdir):
     """Test for PlantCV."""
@@ -69,18 +105,30 @@ def test_save_results_csv(test_data, tmpdir):
                             scale='none', datatype=bool, value=True, label="none")
     outputs.add_observation(sample='default', variable='list', trait='list variable', method='list',
                             scale='none', datatype=list, value=[1, 2, 3], label=[1, 2, 3])
-    outputs.add_observation(sample='default', variable='tuple', trait='tuple variable', method='tuple',
+    outputs.save_results(filename=outfile, outformat="csv", append=True)
+
+    outputs2 = Outputs()
+    outputs2.add_observation(sample='default', variable='tuple', trait='tuple variable', method='tuple',
                             scale='none', datatype=tuple, value=(1, 2), label=(1, 2))
-    outputs.add_observation(sample='default', variable='tuple_list', trait='list of tuples variable',
+    outputs2.add_observation(sample='default', variable='tuple_list', trait='list of tuples variable',
                             method='tuple_list', scale='none', datatype=list, value=[(1, 2), (3, 4)], label=[1, 2])
-    outputs.save_results(filename=outfile, outformat="csv")
+    outputs2.save_results(filename=outfile, outformat="csv", append=True)
+
     with open(outfile, "r") as fp:
         results = fp.read()
     with open(test_data.outputs_results_csv, "r") as fp:
         test_results = fp.read()
     assert results == test_results
 
 
+def test_save_results_invalid_outformat():
+    """Test for PlantCV."""
+    # Create output instance
+    outputs = Outputs()
+    with pytest.raises(ValueError):
+        outputs.save_results(filename="filename does not matter for this test", outformat="INVALIDOUTFORMAT")
+
+
 def test_clear_outputs():
     """Test for PlantCV."""
     # Create output instance