DataModule.pm 10 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316
  1. package Trog::DataModule;
  2. use strict;
  3. use warnings;
  4. use UUID::Tiny;
  5. use List::Util;
  6. use File::Copy;
  7. use Mojo::File;
  8. no warnings 'experimental';
  9. use feature qw{signatures};
  10. =head1 QUERY FORMAT
  11. The $query_language and $query_help variables are shown to the user to explain how to use the search box in the tCMS header.
  12. =head1 POST STRUCTURE
  13. Posts generally need to have the following:
  14. data: Brief description of content, or the content itself.
  15. content_type: What this content actually is. Used to filter into the appropriate pages.
  16. href: Primary link. This is the subject of a news post, or a link to the item itself. Can be local or remote.
  17. local_href: Backup link. Automatically created link to a static cache of the content.
  18. title: Title of the content. Used as link name for the 'href' attribute.
  19. user: Author of the post. Matched against the 'author' query parameter when filtering.
  20. id: Internal identifier in datastore for the post.
  21. tags: array ref of appropriate tags.
  22. created: timestamp of creation of this version of the post
  23. version: revision # of this post.
  24. =head1 CONSTRUCTOR
  25. =head2 new(Config::Simple $config)
  26. Try not to do expensive things here.
  27. =cut
  # Constructor. Asks the config object for its variables (vars() is called in
  # scalar context) and blesses what comes back as the instance itself.
  # Nothing expensive happens here.
  sub new ($class, $config) {
      my $vars = $config->vars();
      return bless $vars, $class;
  }
  # Abstract interface: subclasses are required to implement all of these.
  # The bodies are the yada-yada operator, so calling a base version dies
  # with "Unimplemented".
  sub lang ($self) { ... }
  sub help ($self) { ... }
  # read() receives the request as a HASHREF (see get()).
  sub read ($self, $query={}) { ... }
  # add() calls write() with an ARRAYREF of posts, so the stub accepts that
  # argument; otherwise the caller would get an arity error rather than
  # "Unimplemented".
  sub write ($self, $posts=[]) { ... }
  sub count ($self) { ... }
  38. =head1 METHODS
  39. =head2 get(%request)
  40. Queries the data model. Accepts the following request parameters:
  41. id => Filter down to just the post by ID. May be subsequently filtered by ACL, resulting in a 404 (which is good, as it does not disclose info).
  42. version => if id is passed, return the provided post version rather than the most recent one
  43. tags => ARRAYREF of tags, any one of which is required to give a result. If none are passed, no filtering is performed.
  44. acls => ARRAYREF of acl tags, any one of which is required to give result. Filter applies after tags. 'admin' ACL being present skips this filter.
  45. page => 1-based page number to return. Only applied when limit is also passed.
  46. limit => Maximum number of posts per page.
  47. like => Search query, as might be passed in the search bar.
  48. author => filter by post author
  49. If it is more efficient to filter within your data storage engine, you probably should override this method.
  50. As implemented, this takes the data as a given and filters in post.
  51. =cut
  # Run a query end to end: read the posts from the backend, filter them
  # against the request, decorate the survivors with derived fields and
  # finally cut the list down to the requested page.
  sub get ($self, %request) {
      my $query  = \%request;
      my $stored = $self->read($query);

      my @matching  = $self->filter($query, @$stored);
      my @decorated = $self->_fixup(@matching);
      my @page      = $self->paginate($query, @decorated);
      return @page;
  }
  # Decorate posts with derived fields and make their links URL-safe.
  # The post hashes are modified in place and also returned as a list.
  sub _fixup ($self, @filtered) {
      # First, classify each post (blog, microblog, profile, series or file)
      @filtered = _add_post_type(@filtered);
      # Next, flag what kind of media the post carries
      @filtered = _add_media_type(@filtered);
      # Finally, add visibility
      @filtered = _add_visibility(@filtered);

      #urlencode spaces in filenames
      for my $post (@filtered) {
          for my $param (qw{href preview video_href audio_href local_href wallpaper}) {
              # A key may exist with an undef value; substituting on undef
              # changes nothing and only emits a warning, so skip those too.
              next unless defined $post->{$param};
              $post->{$param} =~ s/ /%20/g;
          }
      }
      return @filtered;
  }
  # Narrow @filtered down to the posts matching $query (a HASHREF).
  # Keys read from the query: id, version, older, tags, acls, like, author.
  # Returns the list of surviving posts.
  sub filter ($self, $query, @filtered) {
      my %request = %$query; #XXX update varnames instead
      $request{acls} //= [];
      $request{tags} //= [];

      # If an ID is passed, only that post is considered; _dedup_versions then
      # selects the requested version, or the latest one when none was given.
      # NOTE: this returns before any tag/ACL filtering below is applied.
      if ($request{id}) {
          @filtered = grep { $_->{id} eq $request{id} } @filtered;
          @filtered = _dedup_versions($request{version}, @filtered);
          return @filtered;
      }

      @filtered = _dedup_versions(undef, @filtered);

      # Keep only posts created before the 'older' timestamp.
      # Coerce older into numeric by dropping every non-digit first.
      if ($request{older}) {
          (my $cutoff = $request{older}) =~ s/[^0-9]//g;
          @filtered = grep { ($_->{created} // 0) < $cutoff } @filtered if $cutoff;
      }

      #XXX Heal bad data -- probably not needed
      for my $post (@filtered) {
          my $tags = $post->{tags} //= [];
          @$tags = grep { defined $_ } @$tags;
      }

      # Next, handle the query, tags and ACLs.
      # A post passes the tag filter when it carries any one of the requested tags.
      if (@{ $request{tags} }) {
          my %wanted = map { $_ => 1 } @{ $request{tags} };
          @filtered = grep { my $post = $_; grep { $wanted{$_} } @{ $post->{tags} } } @filtered;
      }

      # ACLs are matched against the post's tags as well. Without the 'admin'
      # ACL a post must carry at least one of the requested ACLs, so an empty
      # ACL list matches nothing.
      my %acl = map { $_ => 1 } @{ $request{acls} };
      unless ($acl{admin}) {
          @filtered = grep { my $post = $_; grep { $acl{$_} } @{ $post->{tags} } } @filtered;
      }

      # Case-insensitive literal substring search over title and data.
      # Missing fields are treated as empty instead of triggering warnings.
      if ($request{like}) {
          my $needle = qr/\Q$request{like}\E/i;
          @filtered = grep { ($_->{title} // '') =~ $needle || ($_->{data} // '') =~ $needle } @filtered;
      }

      @filtered = grep { ($_->{user} // '') eq $request{author} } @filtered if $request{author};
      return @filtered;
  }
  # Return one page of @filtered.
  #   page  => 1-based page number
  #   limit => number of posts per page
  # Pagination is opt-in: unless both page and limit are passed (and true),
  # the whole list is returned untouched.
  sub paginate ($self, $query, @filtered) {
      my %request = %$query; #XXX change varnames
      return @filtered unless $request{page} && $request{limit};

      my ($page, $limit) = do {
          # Both values come from the request; junk such as "abc" numifies to 0
          no warnings 'numeric';
          (int($request{page}), int($request{limit}));
      };

      # A limit below 1 is treated like no limit at all, the same as limit => 0
      return @filtered unless $limit >= 1;
      # A negative start offset would make the slice count from the end of the
      # list (or die), so anything below the first page means the first page.
      $page = 1 unless $page >= 1;

      my $start = ($page - 1) * $limit;
      my @page;
      if ($start < @filtered) {
          my $end = $start + $limit - 1;
          $end = $#filtered if $end > $#filtered;
          @page = @filtered[$start .. $end];
      }
      # Pages past the end are simply empty
      return @page;
  }
  # Reduce a list of post revisions to one revision per post.
  #   $version defined   => keep only revisions whose version equals $version
  #   $version undefined => keep the highest-versioned revision of every id
  # Every returned post gets a version_max field. Posts are modified in place.
  sub _dedup_versions ($version=-1, @posts) {
      #ASSUMPTION made here - if we pass version this is direct ID query
      if (defined $version) {
          # Highest version among everything passed in, not just the matches
          my $version_max = List::Util::max(map { $_->{version} } @posts);
          my @matching = grep { $_->{version} eq $version } @posts;
          $_->{version_max} //= $version_max for @matching;
          return @matching;
      }

      # Bucket the revisions by id in a single pass, remembering the order in
      # which ids first appear so the output order stays stable.
      my (@id_order, %revisions_of);
      for my $post (@posts) {
          my $id = $post->{id};
          push @id_order, $id unless exists $revisions_of{$id};
          push @{ $revisions_of{$id} }, $post;
      }

      my @deduped;
      for my $id (@id_order) {
          my ($latest) = sort { $b->{version} <=> $a->{version} } @{ $revisions_of{$id} };
          # Sorted descending, so the first revision carries the maximum version
          $latest->{version_max} = $latest->{version};
          push @deduped, $latest;
      }
      return @deduped;
  }
  126. #XXX this probably should be re-factored to be baked into the data from the get-go
  # Set each post's 'type' from its tags. Posts default to 'file'; the rules
  # are tried in ascending priority, so when several tags match the last rule
  # listed wins (series > profile > microblog > blog).
  sub _add_post_type (@posts) {
      my @rules = (
          [ blog   => 'blog' ],
          [ news   => 'microblog' ],
          [ about  => 'profile' ],
          [ series => 'series' ],
      );
      for my $entry (@posts) {
          my $kind = 'file';
          for my $rule (@rules) {
              my ($tag, $name) = @$rule;
              $kind = $name if grep { $_ eq $tag } @{$entry->{tags}};
          }
          $entry->{type} = $kind;
      }
      return @posts;
  }
  # Flag each post with is_video / is_audio / is_image according to the major
  # part of its content_type, and with is_profile when it carries the 'about'
  # tag. A missing content_type is set to ''. Flags are only ever set to 1;
  # they are not created for posts that do not match.
  sub _add_media_type (@posts) {
      for my $entry (@posts) {
          my $mime = $entry->{content_type} //= '';
          if ($mime =~ m/^video\//) { $entry->{is_video} = 1 }
          if ($mime =~ m/^audio\//) { $entry->{is_audio} = 1 }
          if ($mime =~ m/^image\//) { $entry->{is_image} = 1 }

          my $about_tags = grep { $_ eq 'about' } @{$entry->{tags}};
          $entry->{is_profile} = 1 if $about_tags;
      }
      return @posts;
  }
  # Set each post's 'visibility' to the first of its tags that is one of
  # private, unlisted or public. The field is set to undef when no tag matches.
  sub _add_visibility (@posts) {
      my %is_visibility = map { $_ => 1 } qw{private unlisted public};
      for my $entry (@posts) {
          my ($first_match) = grep { $is_visibility{$_} } @{$entry->{tags}};
          $entry->{visibility} = $first_match;
      }
      return @posts;
  }
  158. =head2 count() = INT $num
  159. Returns the total number of posts.
  160. Used to determine paginator parameters.
  161. =cut
  162. =head2 add(@posts) = BOOL $failed_or_not
  163. Add the provided posts to the datastore.
  164. If any post already exists with the same id, a new post with a version higher than it will be added.
  165. Passes an array of new posts to add to the data store module's write() function.
  166. You probably won't want to override this.
  167. =cut
  # Prepare the given posts and hand them to write() as one ARRAYREF.
  # A post without an id gets a fresh UUID. A post whose id is already stored
  # is written as the next version of it. Always returns 0; the result of
  # write() is not inspected.
  sub add ($self, @posts) {
      my @to_write;
      for my $post (@posts) {
          $post->{id} //= UUID::Tiny::create_uuid_as_string(UUID::Tiny::UUID_V1, UUID::Tiny::UUID_NS_DNS);
          $post->{created} = time();

          # get() by id yields the stored revision, if any; bump past it
          if (my @stored = $self->get( id => $post->{id} )) {
              $post->{version} = $stored[0]{version};
              $post->{version}++;
          }
          $post->{version} //= 0;

          push @to_write, scalar _process($post);
      }
      $self->write(\@to_write);
      return 0;
  }
  186. #XXX this level of post-processing seems gross, but may be unavoidable
  187. # Not actually a subprocess, kek
  # Normalise a post before it is written. Uploads are stored, request-only
  # keys are dropped, visibility/ACLs/series are folded into the tags, and
  # content types are derived from the link extensions.
  # Modifies $post in place and returns it.
  sub _process ($post) {
      $post->{href}      = _handle_upload($post->{file}, $post->{id})           if $post->{file};
      $post->{preview}   = _handle_upload($post->{preview_file}, $post->{id})   if $post->{preview_file};
      $post->{wallpaper} = _handle_upload($post->{wallpaper_file}, $post->{id}) if $post->{wallpaper_file};
      # 'app' is optional, so compare against '' rather than undef
      $post->{preview}   = $post->{href} if ($post->{app} // '') eq 'image';

      # Request-only keys must not be persisted. That includes all three raw
      # upload handles, wallpaper_file among them.
      delete @{$post}{qw{app file preview_file wallpaper_file scheme route domain}};

      # Handle acls/tags
      $post->{tags} //= [];
      my %is_visibility = map { $_ => 1 } qw{public private unlisted};
      @{$post->{tags}} = grep { !$is_visibility{$_} } @{$post->{tags}};

      # The visibility (plus the ACLs of private posts) is stored as tags.
      # Nothing is pushed when it is missing, so no undef tag is created.
      my $visibility = delete $post->{visibility};
      if (defined $visibility) {
          if ($visibility eq 'private') {
              my $acls = delete $post->{acls};
              # Accept a single ACL or an ARRAYREF of them
              push @{$post->{tags}}, grep { defined $_ } (ref $acls eq 'ARRAY' ? @$acls : $acls);
          }
          push @{$post->{tags}}, $visibility;
      }

      # Add the 'series' tag if we are in a series, restrict to relevant acl
      if ($post->{series}) {
          push @{$post->{tags}}, 'series', $post->{series};
      }

      #Filter adding the same acl twice
      @{$post->{tags}} = List::Util::uniq(@{$post->{tags}});

      # Handle multimedia content types
      my @media = (
          [ href       => 'content_type' ],
          [ video_href => 'video_content_type' ],
          [ audio_href => 'audio_content_type' ],
      );
      for my $pair (@media) {
          my ($link, $type_key) = @$pair;
          next unless $post->{$link};
          my $ext = Mojo::File->new("www/$post->{$link}")->extname();
          # Without an extension there is nothing to look up; leave the field alone
          next unless length $ext;
          # Loaded on demand: this file does not otherwise load Plack::MIME
          require Plack::MIME;
          $post->{$type_key} = Plack::MIME->mime_type(".$ext");
      }
      return $post;
  }
  # Move an uploaded file into www/assets and return its site-relative link.
  #   $file => HASHREF with 'tempname' (where the upload currently lives)
  #            and 'filename' (the name supplied with the upload)
  #   $uuid => id of the owning post, used as a prefix for the stored name
  # Dies when the file cannot be moved, so a post never links to a missing asset.
  sub _handle_upload ($file, $uuid) {
      my $f = $file->{tempname};
      # The filename is supplied by the uploader: keep only its last path
      # component so it cannot point outside of www/assets.
      (my $basename = $file->{filename} // '') =~ s{.*[/\\]}{}s;
      my $newname = "$uuid.$basename";
      File::Copy::move($f, "www/assets/$newname")
          or die "Could not move upload '$f' to 'www/assets/$newname': $!";
      return "/assets/$newname";
  }
  235. =head2 delete(@posts)
  236. Delete the following posts.
  237. Will remove all versions of said post.
  238. You should override this, it is a stub here.
  239. =cut
  # Stub: storage backends should override this. It accepts the posts to
  # delete so that calling the base version dies with 'stub' rather than
  # with an argument-count error.
  sub delete ($self, @posts) { die 'stub' }
  241. 1;