-
Notifications
You must be signed in to change notification settings - Fork 95
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
Add a outputs pipe module including csv export of results #37
Signed-off-by: Thomas Druez <tdruez@nexb.com>
- Loading branch information
Showing
3 changed files
with
137 additions
and
0 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,63 @@ | ||
# SPDX-License-Identifier: Apache-2.0 | ||
# | ||
# http://nexb.com and https://github.com/nexB/scancode.io | ||
# The ScanCode.io software is licensed under the Apache License version 2.0. | ||
# Data generated with ScanCode.io is provided as-is without warranties. | ||
# ScanCode is a trademark of nexB Inc. | ||
# | ||
# You may not use this software except in compliance with the License. | ||
# You may obtain a copy of the License at: http://apache.org/licenses/LICENSE-2.0 | ||
# Unless required by applicable law or agreed to in writing, software distributed | ||
# under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR | ||
# CONDITIONS OF ANY KIND, either express or implied. See the License for the | ||
# specific language governing permissions and limitations under the License. | ||
# | ||
# Data Generated with ScanCode.io is provided on an "AS IS" BASIS, WITHOUT WARRANTIES | ||
# OR CONDITIONS OF ANY KIND, either express or implied. No content created from | ||
# ScanCode.io should be considered or used as legal advice. Consult an Attorney | ||
# for any legal advice. | ||
# | ||
# ScanCode.io is a free software code scanning tool from nexB Inc. and others. | ||
# Visit https://github.com/nexB/scancode.io for support and download. | ||
|
||
import csv | ||
|
||
from scanpipe.api.serializers import CodebaseResourceSerializer | ||
from scanpipe.api.serializers import DiscoveredPackageSerializer | ||
|
||
|
||
def queryset_to_csv(project, queryset, fieldnames): | ||
""" | ||
Create a csv file from the provided `queryset`. | ||
The fields to include as columns and their order are controlled by the | ||
`fieldnames` list. | ||
The output file is created in the `project` output directory. | ||
""" | ||
model_name = queryset.model._meta.model_name | ||
filename = f"{project.name}_{model_name}.csv" | ||
output_file = project.output_path / filename | ||
|
||
with open(output_file, "w") as csvfile: | ||
writer = csv.DictWriter(csvfile, fieldnames) | ||
writer.writeheader() | ||
for record in queryset.iterator(): | ||
record_dict = {field: getattr(record, field) for field in fieldnames} | ||
writer.writerow(record_dict) | ||
|
||
return output_file | ||
|
||
|
||
def as_csv(project): | ||
""" | ||
Generate results output for the provided `project` as csv format. | ||
Since the csv format does not support multiple tabs, one file is created | ||
per object type. | ||
""" | ||
data_sources = [ | ||
(project.discoveredpackages.all(), DiscoveredPackageSerializer), | ||
(project.codebaseresources.without_symlinks(), CodebaseResourceSerializer), | ||
] | ||
|
||
for queryset, serializer in data_sources: | ||
fieldnames = list(serializer().get_fields().keys()) | ||
queryset_to_csv(project, queryset, fieldnames) |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,70 @@ | ||
# SPDX-License-Identifier: Apache-2.0 | ||
# | ||
# http://nexb.com and https://github.com/nexB/scancode.io | ||
# The ScanCode.io software is licensed under the Apache License version 2.0. | ||
# Data generated with ScanCode.io is provided as-is without warranties. | ||
# ScanCode is a trademark of nexB Inc. | ||
# | ||
# You may not use this software except in compliance with the License. | ||
# You may obtain a copy of the License at: http://apache.org/licenses/LICENSE-2.0 | ||
# Unless required by applicable law or agreed to in writing, software distributed | ||
# under the License is distributed on an "AS IS" BASIS, WITHOUT WARRANTIES OR | ||
# CONDITIONS OF ANY KIND, either express or implied. See the License for the | ||
# specific language governing permissions and limitations under the License. | ||
# | ||
# Data Generated with ScanCode.io is provided on an "AS IS" BASIS, WITHOUT WARRANTIES | ||
# OR CONDITIONS OF ANY KIND, either express or implied. No content created from | ||
# ScanCode.io should be considered or used as legal advice. Consult an Attorney | ||
# for any legal advice. | ||
# | ||
# ScanCode.io is a free software code scanning tool from nexB Inc. and others. | ||
# Visit https://github.com/nexB/scancode.io for support and download. | ||
|
||
from django.test import TestCase | ||
|
||
from scanpipe.models import CodebaseResource | ||
from scanpipe.models import DiscoveredPackage | ||
from scanpipe.models import Project | ||
from scanpipe.pipes import outputs | ||
from scanpipe.tests import package_data1 | ||
|
||
|
||
class ScanPipePipesTest(TestCase): | ||
def test_scanpipe_pipes_outputs_queryset_to_csv(self): | ||
project1 = Project.objects.create(name="Analysis") | ||
codebase_resource = CodebaseResource.objects.create( | ||
project=project1, | ||
path="filename.ext", | ||
) | ||
DiscoveredPackage.create_for_resource( | ||
package_data1, | ||
codebase_resource, | ||
) | ||
|
||
queryset = project1.discoveredpackages.all() | ||
fieldnames = ["purl", "name", "version"] | ||
output_file = outputs.queryset_to_csv(project1, queryset, fieldnames) | ||
|
||
expected = [ | ||
"purl,name,version\n", | ||
"pkg:deb/debian/adduser@3.118?arch=all,adduser,3.118\n", | ||
] | ||
with output_file.open() as f: | ||
self.assertEqual(expected, f.readlines()) | ||
|
||
queryset = project1.codebaseresources.all() | ||
fieldnames = ["for_packages", "path"] | ||
output_file = outputs.queryset_to_csv(project1, queryset, fieldnames) | ||
|
||
expected = [ | ||
"for_packages,path\n", | ||
"['pkg:deb/debian/adduser@3.118?arch=all'],filename.ext\n", | ||
] | ||
with output_file.open() as f: | ||
self.assertEqual(expected, f.readlines()) | ||
|
||
def test_scanpipe_pipes_outputs_as_csv(self): | ||
project1 = Project.objects.create(name="Analysis") | ||
outputs.as_csv(project=project1) | ||
expected = ["Analysis_codebaseresource.csv", "Analysis_discoveredpackage.csv"] | ||
self.assertEqual(expected, project1.output_root) |