George Baugh 9 months ago
Commit
874025e89f
3 changed files with 192 additions and 0 deletions
  1. Readme.md (+3 -0)
  2. lib/Test/Mapper.pm (+39 -0)
  3. lib/Test/Mapper/DB.pm (+150 -0)

+ 3 - 0
Readme.md

@@ -0,0 +1,3 @@
+# Test::Mapper
+
+Map tests to things tested

+ 39 - 0
lib/Test/Mapper.pm

@@ -0,0 +1,39 @@
+package Test::Mapper;
+
+use strict;
+use warnings;
+
+# ABSTRACT: Map which parts of a codebase ought to trigger acceptance tests when changed
+
+=head1 DESCRIPTION
+
+The general tradition in Perl unit testing is that the mapping of 'what to test' when a piece of code changes is simple:
+
+    lib/Foo/Bar.pm -> t/lib-Foo-Bar.t (or t/lib-Foo/Bar.t)
+    bin/baz -> t/bin-baz.t
+
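+That convention is mechanical enough to compute; a minimal sketch (names illustrative):
+
+    sub test_for {
+        my ($source) = @_;          # e.g. 'lib/Foo/Bar.pm' or 'bin/baz'
+        ( my $t = $source ) =~ s{/}{-}g;
+        $t =~ s{\.pm$}{};
+        return "t/$t.t";            # => 't/lib-Foo-Bar.t', 't/bin-baz.t'
+    }
+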
+Unfortunately, things tend to get messy when you engage in more complicated testing, such as integration testing.
+There you have one-to-many relationships, which can still be easily discerned programmatically by inspecting %INC.
+That is, unless you require() modules at runtime (or worse, read & eval/exec), in which case analysis via PPI must be brought to bear.
+Still, most people solve that particular problem with the doctor's adage about "not doing things that hurt".
+
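+A hedged sketch of that discernment (the module name is illustrative):
+
+    require Foo::Bar;    # whatever the test pulls in
+    # %INC maps each loaded module to the file it came from, e.g.
+    # 'Foo/Bar.pm' => '/path/to/lib/Foo/Bar.pm'; runtime require()s
+    # only show up after they execute, hence the PPI caveat above.
+    print "$_ => $INC{$_}\n" for sort keys %INC;
+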
+However, acceptance tests are a many-to-many mapping, and will quickly blow out your build server's compute budget.
+To make things worse, much of the stack isn't necessarily in $LANGUAGE_OF_CHOICE.
+Furthermore, this is not something that can simply be avoided via careful structuring.
+
+Knowing all this, what then shall we do?  Cheat.
+That is, break an insoluble problem into many smaller soluble ones.
+It is well within the ability of a test author to discern the route via which an acceptance test accesses a feature.
+Indeed, this is necessarily so.
+
+As such, if we structure our mapping from this perspective, life quickly becomes simpler.
+Taking an average web application as an example, we can imagine a mapping like:
+
+    t/acceptance/DoFoobarFeature.t -> GET /ez/bez, POST /huth/buth, ...
+
+Every endpoint loaded this way necessarily pulls in a number of resources.
+It is well within the realm of possibility to hit these endpoints with L<Playwright>, grab an HTTP Archive (HAR) and map it to the relevant source files in the repo.
+
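+A hedged sketch of the HAR half of that mapping (file names and the routing table are illustrative):
+
+    use JSON::PP ();
+    use File::Slurper ();
+
+    # Hypothetical routing table: which repo file serves which endpoint.
+    my %routes = ( '/ez/bez' => 'lib/App/Bez.pm', '/huth/buth' => 'lib/App/Buth.pm' );
+
+    # HAR files are JSON; each log entry records one request the test made.
+    my $har = JSON::PP::decode_json( File::Slurper::read_binary('DoFoobarFeature.har') );
+    foreach my $entry ( @{ $har->{log}{entries} } ) {
+        my ($path) = $entry->{request}{url} =~ m{^https?://[^/]+([^?#]*)};
+        print "$path => $routes{$path}\n" if $path && exists $routes{$path};
+    }
+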
+Similarly, one can (in most cases) do the same thing with ordinary applications via C<ldd>, C<strace> and so forth.
+
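+For instance (a sketch; the binary name is illustrative):
+
+    # Shared libraries linked at startup:
+    ldd bin/myapp
+    # Every file the application opens while the test drives it:
+    strace -f -e trace=open,openat -o opened.log bin/myapp
+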
+=cut

+ 150 - 0
lib/Test/Mapper/DB.pm

@@ -0,0 +1,150 @@
+package Test::Mapper::DB;
+
+use strict;
+use warnings;
+
+use DBI;
+use File::Touch ();
+
+# ABSTRACT: Persistent storage for what test maps where for what build.
+
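+# Usage sketch (the database file name is illustrative); handles are cached per name:
+#
+#     use Test::Mapper::DB;
+#     my $db = Test::Mapper::DB::dbh('mapper.db');
+#     $db->do("INSERT INTO product (product) VALUES ('fooProduct')");
+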
+# We hold possibly multiple DBHs to support testing multiple products.
+my $dbh = {};
+
+# Cache the schema read from __DATA__; the handle is exhausted after one read.
+my $schema;
+
+sub dbh {
+    my ( $dbname ) = @_;
+
+    return $dbh->{$dbname} if $dbh->{$dbname};
+
+    # Slurp the whole DATA section on first use; it is SQL, not a file name.
+    $schema //= do { local $/; readline(DATA) };
+
+    File::Touch::touch($dbname) unless -f $dbname;
+    my $db = DBI->connect( "dbi:SQLite:dbname=$dbname", "", "" )
+        or die "Could not connect to '$dbname': " . DBI->errstr;
+
+    if ($schema) {
+        $db->{sqlite_allow_multiple_statements} = 1;
+        $db->do($schema) or die "Could not ensure database consistency: " . $db->errstr;
+        $db->{sqlite_allow_multiple_statements} = 0;
+    }
+
+    $dbh->{$dbname} = $db;
+
+    # Turn on fkeys
+    $db->do("PRAGMA foreign_keys = ON") or die "Could not enable foreign keys: " . $db->errstr;
+
+    # Turn on WAL mode
+    $db->do("PRAGMA journal_mode = WAL") or die "Could not enable WAL mode: " . $db->errstr;
+
+    return $db;
+}
+
+1;
+
+__DATA__
+
+-- Should be pretty self-explanatory, DRY
+CREATE TABLE IF NOT EXISTS product (
+    id INTEGER PRIMARY KEY AUTOINCREMENT,
+    product TEXT NOT NULL UNIQUE
+);
+
+CREATE TABLE IF NOT EXISTS environment (
+    id INTEGER PRIMARY KEY AUTOINCREMENT,
+    environment TEXT NOT NULL,
+    product_id INTEGER NOT NULL REFERENCES product(id) ON DELETE CASCADE,
+    UNIQUE(environment, product_id) ON CONFLICT IGNORE
+);
+
+CREATE TABLE IF NOT EXISTS build (
+    id INTEGER PRIMARY KEY AUTOINCREMENT,
+    build TEXT NOT NULL,
+    product_id INTEGER NOT NULL REFERENCES product(id) ON DELETE CASCADE,
+    UNIQUE(build, product_id) ON CONFLICT IGNORE
+);
+
+CREATE TABLE IF NOT EXISTS route (
+    id INTEGER PRIMARY KEY AUTOINCREMENT,
+    route TEXT NOT NULL,
+    product_id INTEGER NOT NULL REFERENCES product(id) ON DELETE CASCADE,
+    UNIQUE(route, product_id) ON CONFLICT IGNORE
+);
+
+CREATE TABLE IF NOT EXISTS test (
+    id INTEGER PRIMARY KEY AUTOINCREMENT,
+    filename TEXT NOT NULL,
+    product_id INTEGER NOT NULL REFERENCES product(id) ON DELETE CASCADE,
+    UNIQUE(filename, product_id) ON CONFLICT IGNORE
+);
+
+-- run_by is used to coordinate running (what hasn't been taken yet, etc.)
+-- result is a result code that visualization programs can use for historical charts
+-- The idea here is that 'people just wanna see what failed', and this helps narrow that down
+-- start/finish are there so you can build historical data/charts
+CREATE TABLE IF NOT EXISTS test_for_build (
+    build_id INTEGER NOT NULL REFERENCES build(id),
+    test_id  INTEGER NOT NULL REFERENCES test(id),
+    run_by   TEXT,
+    result   INTEGER,
+    start    INTEGER NOT NULL DEFAULT CURRENT_TIMESTAMP,
+    finish   INTEGER DEFAULT NULL,
+    UNIQUE(build_id, test_id) ON CONFLICT ROLLBACK
+);
+
+-- Actually map each test to the files whose changing triggers its running.
+-- One tends to use differing resources in different environments.
+-- It is however assumed that the tests (or the cron inserting resources/tests) discriminate in this regard.
+CREATE TABLE IF NOT EXISTS resource (
+    resource_id INTEGER PRIMARY KEY AUTOINCREMENT,
+    environment_id INTEGER NOT NULL REFERENCES environment(id),
+    filename TEXT NOT NULL,
+    UNIQUE(environment_id, filename) ON CONFLICT IGNORE
+);
+
+-- Indexed by resource_id, as that's how a build queries it: "I have X changed resources, what do I run?"
+CREATE TABLE IF NOT EXISTS tested_by (
+    resource_id INTEGER NOT NULL REFERENCES resource(resource_id),
+    test_id INTEGER NOT NULL REFERENCES test(id),
+    UNIQUE(resource_id, test_id) ON CONFLICT IGNORE
+);
+
+-- Lifecycle:
+-- Have list of files from `git log`
+-- Run analysis script that returns hash test_file => [source_file, ...]
+-- INSERT INTO to_run (test_file, source_file, environment) VALUES (...);
+CREATE VIEW IF NOT EXISTS to_run AS SELECT
+     t.filename AS test_file,
+     t.id AS test_id,
+     r.filename AS source_file,
+     e.environment AS environment
+FROM resource AS r
+JOIN tested_by AS tb ON tb.resource_id=r.resource_id
+JOIN test AS t ON t.id=tb.test_id
+JOIN environment AS e ON e.id=r.environment_id
+;
+
+-- TODO: make writable view for above intended for cron dumpage
+
+-- Lifecycle:
+-- Cron dumps rows into resource/tested_by; when the time comes to run, we grab the list:
+-- SELECT test_file FROM to_run WHERE source_file IN (...) GROUP BY test_file;
+-- We make a run:
+-- INSERT INTO run (product, environment, build, test_file) SELECT 'fooProduct', 'MsWin32', 'someSha', test_file FROM to_run WHERE source_file IN (...) GROUP BY test_file;
+-- We run a test:
+-- UPDATE run SET run_by='processid:90210' WHERE product='fooProduct' AND environment='MsWin32' AND build='someSha' AND test_file='actually_being_run.t';
+-- It completes. The end.
+-- UPDATE run SET result=1, finish=CURRENT_TIMESTAMP WHERE ...;
+CREATE VIEW IF NOT EXISTS run AS SELECT
+    p.product,
+    e.environment,
+    b.build,
+    r.route,
+    t.filename AS test_file,
+    tb.run_by,
+    tb.result,
+    tb.start,
+    tb.finish
+FROM product AS p
+JOIN build AS b ON p.id=b.product_id
+JOIN test_for_build AS tb ON b.id=tb.build_id
+JOIN environment AS e ON p.id=e.product_id
+JOIN route AS r ON p.id=r.product_id
+JOIN test AS t ON tb.test_id=t.id
+;
+
+-- TODO: writable view to_run to make above lifecycle a real boy
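+
+-- A hedged sketch of what that writable view could look like, via an INSTEAD OF
+-- trigger; covers only the INSERT half of the lifecycle above, and the
+-- product/build scoping is an assumption:
+CREATE TRIGGER IF NOT EXISTS run_insert INSTEAD OF INSERT ON run
+BEGIN
+    INSERT INTO test_for_build (build_id, test_id)
+    SELECT b.id, t.id
+    FROM build AS b
+    JOIN product AS p ON p.id = b.product_id
+    JOIN test AS t ON t.product_id = p.id
+    WHERE p.product = NEW.product
+      AND b.build = NEW.build
+      AND t.filename = NEW.test_file;
+END;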