diff options
Diffstat (limited to 'util/devdump.pl')
-rwxr-xr-x | util/devdump.pl | 129 |
1 files changed, 70 insertions, 59 deletions
diff --git a/util/devdump.pl b/util/devdump.pl index af7bd776..e0f0f80f 100755 --- a/util/devdump.pl +++ b/util/devdump.pl @@ -17,35 +17,46 @@ use lib $ROOT.'/lib'; my $db = DBI->connect('dbi:Pg:dbname=vndb', 'vndb', undef, { RaiseError => 1 }); +sub ids { join ',', map "'$_'", @{$_[0]} } +sub idq { ids $db->selectcol_arrayref($_[0]) } + +chdir($ENV{VNDB_VAR}//'var'); # Figure out which DB entries to export -my @vids = (3, 17, 97, 183, 264, 266, 384, 407, 1910, 2932, 5922, 6438, 9837); -my $vids = join ',', @vids; -my $staff = $db->selectcol_arrayref( +my $large = ($ARGV[0]||'') eq 'large'; + +my $vids = $large ? 'SELECT id FROM vn' : ids [qw/v3 v17 v97 v183 v264 v266 v384 v407 v1910 v2932 v5922 v6438 v9837/]; +my $staff = $large ? 'SELECT id FROM staff' : idq( "SELECT c2.itemid FROM vn_staff_hist v JOIN changes c ON c.id = v.chid JOIN staff_alias_hist a ON a.aid = v.aid JOIN changes c2 ON c2.id = a.chid WHERE c.itemid IN($vids) " ."UNION " ."SELECT c2.itemid FROM vn_seiyuu_hist v JOIN changes c ON c.id = v.chid JOIN staff_alias_hist a ON a.aid = v.aid JOIN changes c2 ON c2.id = a.chid WHERE c.itemid IN($vids)" ); -my $releases = $db->selectcol_arrayref("SELECT DISTINCT c.itemid FROM releases_vn_hist v JOIN changes c ON c.id = v.chid WHERE v.vid IN($vids)"); -my $producers = $db->selectcol_arrayref("SELECT pid FROM releases_producers_hist p JOIN changes c ON c.id = p.chid WHERE c.type = 'r' AND c.itemid IN(".join(',',@$releases).")"); -my $characters = $db->selectcol_arrayref( +my $releases = $large ? 'SELECT id FROM releases' : idq( + "SELECT DISTINCT c.itemid FROM releases_vn_hist v JOIN changes c ON c.id = v.chid WHERE v.vid IN($vids)" +); +my $producers = $large ? 'SELECT id FROM producers' : idq( + "SELECT pid FROM releases_producers_hist p JOIN changes c ON c.id = p.chid WHERE c.itemid IN($releases)" +); +my $characters = $large ? 'SELECT id FROM chars' : idq( "SELECT DISTINCT c.itemid FROM chars_vns_hist e JOIN changes c ON c.id = e.chid WHERE e.vid IN($vids) " ."UNION " ."SELECT DISTINCT h.main FROM chars_vns_hist e JOIN changes c ON c.id = e.chid JOIN chars_hist h ON h.chid = e.chid WHERE e.vid IN($vids) AND h.main IS NOT NULL" ); -my $images = $db->selectcol_arrayref(q{ - SELECT image FROM chars_hist ch JOIN changes c ON c.id = ch.chid WHERE c.type = 'c' AND c.itemid IN(}.join(',',@$characters).qq{) AND ch.image IS NOT NULL - UNION SELECT image FROM vn_hist vh JOIN changes c ON c.id = vh.chid WHERE c.type = 'v' AND c.itemid IN($vids) AND vh.image IS NOT NULL - UNION SELECT scr FROM vn_screenshots_hist vs JOIN changes c ON c.id = vs.chid WHERE c.type = 'v' AND c.itemid IN($vids) -}); +my $imageids = !$large && $db->selectcol_arrayref(" + SELECT image FROM chars_hist ch JOIN changes c ON c.id = ch.chid WHERE c.itemid IN($characters) AND ch.image IS NOT NULL + UNION SELECT image FROM vn_hist vh JOIN changes c ON c.id = vh.chid WHERE c.itemid IN($vids) AND vh.image IS NOT NULL + UNION SELECT scr FROM vn_screenshots_hist vs JOIN changes c ON c.id = vs.chid WHERE c.itemid IN($vids) +"); +my $images = $large ? 'SELECT id FROM images' : ids($imageids); # Helper function to copy a table or SQL statement. Can do modifications on a # few columns (the $specials). sub copy { my($dest, $sql, $specials) = @_; + warn "$dest...\n"; $sql ||= "SELECT * FROM $dest"; $specials ||= {}; @@ -56,15 +67,11 @@ sub copy { grep !($specials->{$_} && $specials->{$_} eq 'del'), @{$s->{NAME}} }; - printf "COPY %s (%s) FROM stdin;\n", $dest, join ', ', map "\"$_\"", @cols; + printf "COPY %s (%s) FROM stdin;\n", $dest, join ', ', @cols; $sql = "SELECT " . join(',', map { my $s = $specials->{$_} || ''; - if($s eq 'user') { - qq{"$_" % 10 AS "$_"} - } else { - qq{"$_"} - } + $s eq 'user' ? "CASE WHEN vndbid_num($_) % 10 = 0 THEN NULL ELSE vndbid('u', vndbid_num($_) % 10) END AS $_" : $_; } @cols) . " FROM ($sql) AS x"; #warn $sql; $db->do("COPY ($sql) TO STDOUT"); @@ -77,14 +84,13 @@ sub copy { # Helper function to copy a full DB entry with history and all (doesn't handle references) sub copy_entry { - my($type, $tables, $ids) = @_; - $ids = join ',', @$ids; - copy changes => "SELECT * FROM changes WHERE type = '$type' AND itemid IN($ids)", {requester => 'user', ip => 'del'}; + my($tables, $ids) = @_; + copy changes => "SELECT * FROM changes WHERE itemid IN($ids)", {requester => 'user', ip => 'del'}; for(@$tables) { my $add = ''; $add = " AND vid IN($vids)" if /^releases_vn/ || /^vn_relations/ || /^chars_vns/; copy $_ => "SELECT * FROM $_ WHERE id IN($ids) $add"; - copy "${_}_hist" => "SELECT x.* FROM ${_}_hist x JOIN changes c ON c.id = x.chid WHERE c.type = '$type' AND c.itemid IN($ids) $add"; + copy "${_}_hist" => "SELECT x.* FROM ${_}_hist x JOIN changes c ON c.id = x.chid WHERE c.itemid IN($ids) $add"; } } @@ -95,6 +101,7 @@ sub copy_entry { print "-- This file replaces 'sql/all.sql'.\n"; print "\\set ON_ERROR_STOP 1\n"; + print "\\i sql/util.sql\n"; print "\\i sql/schema.sql\n"; print "\\i sql/data.sql\n"; print "\\i sql/func.sql\n"; @@ -109,65 +116,66 @@ sub copy_entry { # A few pre-defined users # This password is 'hunter2' with the default salt my $pass = '000100000801ec4185fed438752d6b3b968e2b2cd045f70005cb7e10cafdbb694a82246bd34a065b6e977e0c3dcc'; - printf "INSERT INTO users (id, username, mail, perm_usermod, passwd, email_confirmed) VALUES (%d, '%s', '%s', %s, decode('%s', 'hex'), true);\n", @$_, $pass for( - [ 2, 'admin', 'admin@vndb.org', 'true' ], - [ 3, 'user1', 'user1@vndb.org', 'false'], - [ 4, 'user2', 'user2@vndb.org', 'false'], - [ 5, 'user3', 'user3@vndb.org', 'false'], - [ 6, 'user4', 'user4@vndb.org', 'false'], - [ 7, 'user5', 'user5@vndb.org', 'false'], - [ 8, 'user6', 'user6@vndb.org', 'false'], - [ 9, 'user7', 'user7@vndb.org', 'false'], - ); + for( + [ 'u2', 'admin', 'admin@vndb.org', 'true', 'true'], + [ 'u3', 'mod', 'mod@vndb.org', 'false', 'true'], + [ 'u4', 'user1', 'user1@vndb.org', 'false', 'false'], + [ 'u5', 'user2', 'user2@vndb.org', 'false', 'false'], + [ 'u6', 'user3', 'user3@vndb.org', 'false', 'false'], + [ 'u7', 'user4', 'user4@vndb.org', 'false', 'false'], + [ 'u8', 'user5', 'user5@vndb.org', 'false', 'false'], + [ 'u9', 'user6', 'user6@vndb.org', 'false', 'false'], + ) { + printf "INSERT INTO users (id, username, email_confirmed, perm_dbmod, perm_tagmod) VALUES ('%s', '%s', true, '%s', '%s');\n", @{$_}[0,1,4,4]; + printf "INSERT INTO users_shadow (id, mail, perm_usermod, passwd) VALUES ('%s', '%s', %s, decode('%s', 'hex'));\n", @{$_}[0,2,3], $pass; + printf "INSERT INTO users_prefs (id) VALUES ('%s');\n", $_->[0]; + } print "SELECT ulist_labels_create(id) FROM users;\n"; # Tags & traits - copy tags => undef, {addedby => 'user'}; - copy 'tags_aliases'; - copy 'tags_parents'; - copy traits => undef, {addedby => 'user'}; - copy 'traits_parents'; + copy_entry [qw/tags tags_parents/], 'SELECT id FROM tags'; + copy_entry [qw/traits traits_parents/], 'SELECT id FROM traits'; # Wikidata (TODO: This could be a lot more selective) copy 'wikidata'; # Image metadata - my $image_ids = join ',', map "'$_'", @$images; - copy images => "SELECT * FROM images WHERE id IN($image_ids)"; - copy image_votes => "SELECT DISTINCT ON (id,uid%10) * FROM image_votes WHERE id IN($image_ids)", { uid => 'user' }; + copy images => "SELECT * FROM images WHERE id IN($images)", { uploader => 'user' }; + copy image_votes => "SELECT DISTINCT ON (id,vndbid('u', vndbid_num(uid)%10+10)) * FROM image_votes WHERE id IN($images)", { uid => 'user' }; # Threads (announcements) - my $threads = join ',', @{ $db->selectcol_arrayref("SELECT tid FROM threads_boards b WHERE b.type = 'an'") }; + my $threads = idq("SELECT tid FROM threads_boards b WHERE b.type = 'an'"); copy threads => "SELECT * FROM threads WHERE id IN($threads)"; copy threads_boards => "SELECT * FROM threads_boards WHERE tid IN($threads)"; copy threads_posts => "SELECT * FROM threads_posts WHERE tid IN($threads)", { uid => 'user' }; # Doc pages - copy_entry d => ['docs'], $db->selectcol_arrayref('SELECT id FROM docs'); + copy_entry ['docs'], 'SELECT id FROM docs'; # Staff - copy_entry s => [qw/staff staff_alias/], $staff; + copy_entry [qw/staff staff_alias/], $staff; # Producers (TODO: Relations) - copy_entry p => [qw/producers/], $producers; + copy_entry [qw/producers/], $producers; # Characters - copy_entry c => [qw/chars chars_traits chars_vns/], $characters; + copy_entry [qw/chars chars_traits chars_vns/], $characters; # Visual novels - copy anime => "SELECT DISTINCT a.* FROM anime a JOIN vn_anime_hist v ON v.aid = a.id JOIN changes c ON c.id = v.chid WHERE c.type = 'v' AND c.itemid IN($vids)"; - copy_entry v => [qw/vn vn_anime vn_seiyuu vn_staff vn_relations vn_screenshots/], \@vids; + copy anime => "SELECT DISTINCT a.* FROM anime a JOIN vn_anime_hist v ON v.aid = a.id JOIN changes c ON c.id = v.chid WHERE c.itemid IN($vids)"; + copy_entry [qw/vn vn_anime vn_editions vn_seiyuu vn_staff vn_relations vn_screenshots vn_titles/], $vids; # VN-related niceties - copy tags_vn => "SELECT DISTINCT ON (tag,vid,uid%10) * FROM tags_vn WHERE vid IN($vids)", {uid => 'user'}; - copy quotes => "SELECT * FROM quotes WHERE vid IN($vids)"; - my $votes = "SELECT vid, uid%8+2 AS uid, (percentile_cont((uid%8+1)::float/9) WITHIN GROUP (ORDER BY vote))::smallint AS vote, MIN(vote_date) AS vote_date" - ." FROM ulist_vns WHERE vid IN($vids) AND vote IS NOT NULL GROUP BY vid, uid%8"; - copy ulist_vns => $votes, {uid => 'user'}; - copy ulist_vns_labels => "SELECT vid, uid, 7 AS lbl FROM ($votes) x", {uid => 'user'}; + copy vn_length_votes => "SELECT DISTINCT ON (vid,vndbid_num(uid)%10) * FROM vn_length_votes WHERE NOT private AND vid IN($vids)", {uid => 'user'}; + copy tags_vn => "SELECT DISTINCT ON (tag,vid,vndbid_num(uid)%10) * FROM tags_vn WHERE vid IN($vids)", {uid => 'user'}; + copy quotes => "SELECT * FROM quotes WHERE rand IS NOT NULL AND vid IN($vids)", {addedby => 'user'}; + copy ulist_vns => "SELECT vid, vndbid('u', vndbid_num(uid)%8+2) AS uid, MIN(vote_date) AS vote_date, '{7}' AS labels, false AS c_private + , (percentile_cont((vndbid_num(uid)%8+1)::float/9) WITHIN GROUP (ORDER BY vote))::smallint AS vote + FROM ulist_vns WHERE vid IN($vids) AND vote IS NOT NULL GROUP BY vid, vndbid_num(uid)%8", {uid => 'user'}; # Releases - copy_entry r => [qw/releases releases_lang releases_media releases_platforms releases_producers releases_vn/], $releases; + copy 'drm'; + copy_entry [qw/releases releases_drm releases_media releases_platforms releases_producers releases_titles releases_vn/], $releases; print "\\i sql/tableattrs.sql\n"; print "\\i sql/triggers.sql\n"; @@ -175,16 +183,18 @@ sub copy_entry { # Update some caches print "SELECT tag_vn_calc(NULL);\n"; print "SELECT traits_chars_calc(NULL);\n"; - print "SELECT update_vncache(id) FROM vn;\n"; + print "SELECT count(*) FROM (SELECT update_vncache(id) FROM vn) x;\n"; print "SELECT update_stats_cache_full();\n"; print "SELECT update_vnvotestats();\n"; print "SELECT update_users_ulist_stats(NULL);\n"; print "SELECT update_images_cache(NULL);\n"; + print "SELECT count(*) FROM (SELECT update_search(id) FROM $_) x;\n" for (qw/chars producers vn releases staff tags traits/); print "UPDATE users u SET c_tags = (SELECT COUNT(*) FROM tags_vn v WHERE v.uid = u.id);\n"; print "UPDATE users u SET c_changes = (SELECT COUNT(*) FROM changes c WHERE c.requester = u.id);\n"; print "\\set ON_ERROR_STOP 0\n"; print "\\i sql/perms.sql\n"; + print "VACUUM ANALYZE;\n"; select STDOUT; close $OUT; @@ -192,10 +202,11 @@ sub copy_entry { - # Now figure out which images we need, and throw everything in a tarball -sub img { sprintf 'static/%s/%02d/%d.jpg', $_[0], $_[1]%100, $_[1] } -my @imgpaths = sort map { my($t,$id) = /([a-z]+)([0-9]+)/; (img($t, $id), $t eq 'sf' ? img('st', $id) : ()) } @$images; +if(!$large) { + sub img { sprintf 'static/%s/%02d/%d.jpg', $_[0], $_[1]%100, $_[1] } + my @imgpaths = sort map { my($t,$id) = /([a-z]+)([0-9]+)/; (img($t, $id), $t eq 'sf' ? img('sf.t', $id) : ()) } @$imageids; -system("tar -czf devdump.tar.gz dump.sql ".join ' ', @imgpaths); -unlink 'dump.sql'; + system("tar -czf devdump.tar.gz dump.sql ".join ' ', @imgpaths); + unlink 'dump.sql'; +} |