aboutsummaryrefslogtreecommitdiffstats
path: root/test/lib
diff options
context:
space:
mode:
authorMatthias Baumgartner <dev@igsor.net>2022-12-18 14:22:31 +0100
committerMatthias Baumgartner <dev@igsor.net>2022-12-18 14:22:31 +0100
commit7582c280ad5324a2f0427999911c7e7abc14a6ab (patch)
tree0a59bbfe1c44d3497daad9f25ff9e7eb2bf9eb82 /test/lib
parentcb49e4567a18de6851286ff672e54f9a91865fe9 (diff)
parent057e09d6537bf5c39815661a75819081e3e5fda7 (diff)
downloadbsie-7582c280ad5324a2f0427999911c7e7abc14a6ab.tar.gz
bsie-7582c280ad5324a2f0427999911c7e7abc14a6ab.tar.bz2
bsie-7582c280ad5324a2f0427999911c7e7abc14a6ab.zip
Merge branch 'develop' into main
Diffstat (limited to 'test/lib')
-rw-r--r--test/lib/__init__.py0
-rw-r--r--test/lib/test_bsie.py179
-rw-r--r--test/lib/testfile.t1
3 files changed, 180 insertions, 0 deletions
diff --git a/test/lib/__init__.py b/test/lib/__init__.py
new file mode 100644
index 0000000..e69de29
--- /dev/null
+++ b/test/lib/__init__.py
diff --git a/test/lib/test_bsie.py b/test/lib/test_bsie.py
new file mode 100644
index 0000000..771a0c2
--- /dev/null
+++ b/test/lib/test_bsie.py
@@ -0,0 +1,179 @@
+"""
+
+Part of the bsie test suite.
+A copy of the license is provided with the project.
+Author: Matthias Baumgartner, 2022
+"""
+# imports
+import os
+import unittest
+
+# bsie imports
+from bsie.base import extractor
+from bsie.tools import builder
+from bsie.utils import bsfs, node, ns
+
+# objects to test
+from bsie.lib.bsie import BSIE
+
+
+## code ##
+
+class TestBSIE(unittest.TestCase):
+ def setUp(self):
+ # reader builder
+ rbuild = builder.ReaderBuilder({})
+ # extractor builder
+ ebuild = builder.ExtractorBuilder([
+ {'bsie.extractor.generic.path.Path': {}},
+ {'bsie.extractor.generic.stat.Stat': {}},
+ {'bsie.extractor.generic.constant.Constant': dict(
+ tuples=[('http://bsfs.ai/schema/Entity#author', 'Me, myself, and I')],
+ schema='''
+ bse:author rdfs:subClassOf bsfs:Predicate ;
+ rdfs:domain bsfs:Entity ;
+ rdfs:range xsd:string ;
+ bsfs:unique "true"^^xsd:boolean .
+ ''',
+ )},
+ ])
+ # build pipeline
+ self.prefix = bsfs.Namespace('http://example.com/local/')
+ pbuild = builder.PipelineBuilder(self.prefix, rbuild, ebuild)
+ self.pipeline = pbuild.build()
+
+ def test_construction(self):
+ # pipeline only
+ lib = BSIE(self.pipeline)
+ self.assertSetEqual(set(lib.principals), {
+ ns.bse.filename,
+ ns.bse.filesize,
+ ns.bse.author,
+ })
+ self.assertEqual(lib.schema, bsfs.schema.Schema.from_string(extractor.SCHEMA_PREAMBLE + '''
+ bse:filename rdfs:subClassOf bsfs:Predicate ;
+ rdfs:domain bsfs:File ;
+ rdfs:range xsd:string ;
+ bsfs:unique "false"^^xsd:boolean .
+
+ bse:filesize rdfs:subClassOf bsfs:Predicate ;
+ rdfs:domain bsfs:File ;
+ rdfs:range xsd:integer;
+ bsfs:unique "false"^^xsd:boolean .
+
+ bse:author rdfs:subClassOf bsfs:Predicate ;
+ rdfs:domain bsfs:Entity ;
+ rdfs:range xsd:string ;
+ bsfs:unique "true"^^xsd:boolean .
+ '''))
+
+ # specify collect
+ lib = BSIE(self.pipeline, collect={
+ ns.bse.filesize,
+ ns.bse.author,
+ ns.bse.inexistent,
+ })
+ self.assertSetEqual(set(lib.principals), {
+ ns.bse.filesize,
+ ns.bse.author,
+ })
+ self.assertEqual(lib.schema, bsfs.schema.Schema.from_string(extractor.SCHEMA_PREAMBLE + '''
+ bse:filesize rdfs:subClassOf bsfs:Predicate ;
+ rdfs:domain bsfs:File ;
+ rdfs:range xsd:integer;
+ bsfs:unique "false"^^xsd:boolean .
+
+ bse:author rdfs:subClassOf bsfs:Predicate ;
+ rdfs:domain bsfs:Entity ;
+ rdfs:range xsd:string ;
+ bsfs:unique "true"^^xsd:boolean .
+ '''))
+ # empty collect is disregarded
+ lib = BSIE(self.pipeline, collect={})
+ self.assertSetEqual(set(lib.principals), {
+ ns.bse.filename,
+ ns.bse.filesize,
+ ns.bse.author,
+ })
+ self.assertEqual(lib.schema, bsfs.schema.Schema.from_string(extractor.SCHEMA_PREAMBLE + '''
+ bse:filename rdfs:subClassOf bsfs:Predicate ;
+ rdfs:domain bsfs:File ;
+ rdfs:range xsd:string ;
+ bsfs:unique "false"^^xsd:boolean .
+
+ bse:filesize rdfs:subClassOf bsfs:Predicate ;
+ rdfs:domain bsfs:File ;
+ rdfs:range xsd:integer;
+ bsfs:unique "false"^^xsd:boolean .
+
+ bse:author rdfs:subClassOf bsfs:Predicate ;
+ rdfs:domain bsfs:Entity ;
+ rdfs:range xsd:string ;
+ bsfs:unique "true"^^xsd:boolean .
+
+ '''))
+
+ # specify discard
+ lib = BSIE(self.pipeline, discard={
+ ns.bse.filesize,
+ ns.bse.filename,
+ ns.bse.inexistent,
+ })
+ self.assertSetEqual(set(lib.principals), {
+ ns.bse.author,
+ })
+ self.assertEqual(lib.schema, bsfs.schema.Schema.from_string(extractor.SCHEMA_PREAMBLE + '''
+ bse:author rdfs:subClassOf bsfs:Predicate ;
+ rdfs:domain bsfs:Entity ;
+ rdfs:range xsd:string ;
+ bsfs:unique "true"^^xsd:boolean .
+ '''))
+
+ # specify collect and discard
+ lib = BSIE(self.pipeline,
+ collect={ns.bse.filesize, ns.bse.author, ns.bse.foo, ns.bse.bar},
+ discard={ns.bse.author, ns.bse.foo, ns.bse.foobar},
+ )
+ self.assertSetEqual(set(lib.principals), {
+ ns.bse.filesize,
+ })
+ self.assertEqual(lib.schema, bsfs.schema.Schema.from_string(extractor.SCHEMA_PREAMBLE + '''
+ bse:filesize rdfs:subClassOf bsfs:Predicate ;
+ rdfs:domain bsfs:File ;
+ rdfs:range xsd:integer;
+ bsfs:unique "false"^^xsd:boolean .
+
+ '''))
+
+
+ def test_from_file(self):
+ # setup
+ lib = BSIE(self.pipeline)
+ self.assertSetEqual(set(lib.principals), {
+ ns.bse.filesize,
+ ns.bse.filename,
+ ns.bse.author,
+ })
+ content_hash = 'a948904f2f0f479b8f8197694b30184b0d2ed1c1cd2a1ec0fb85d299a192a447'
+ subject = node.Node(ns.bsfs.File, (self.prefix + 'file#')[content_hash])
+ testfile = os.path.join(os.path.dirname(__file__), 'testfile.t')
+
+ # from_file extracts all available triples
+ self.assertSetEqual(set(lib.from_file(testfile)), {
+ (subject, lib.schema.predicate(ns.bse.filename), 'testfile.t'),
+ (subject, lib.schema.predicate(ns.bse.filesize), 12),
+ (subject, lib.schema.predicate(ns.bse.author), 'Me, myself, and I'),
+ })
+
+ # from_file respects predicate argument
+ self.assertSetEqual(set(lib.from_file(testfile, {ns.bse.filename, ns.bse.invalid})), {
+ (subject, lib.schema.predicate(ns.bse.filename), 'testfile.t'),
+ })
+
+
+## main ##
+
+if __name__ == '__main__':
+ unittest.main()
+
+## EOF ##
diff --git a/test/lib/testfile.t b/test/lib/testfile.t
new file mode 100644
index 0000000..3b18e51
--- /dev/null
+++ b/test/lib/testfile.t
@@ -0,0 +1 @@
+hello world