ArielGlenn has uploaded a new change for review. ( https://gerrit.wikimedia.org/r/396931 )
Change subject: get rid of datasets1001 mount on snapshot hosts ...................................................................... get rid of datasets1001 mount on snapshot hosts As part of this cleanup: * get rid of secondary wikidump.conf file, which contained references to paths on that filesystem * change all references to wikidump.conf; these should now all point to wikidump.conf.dumps * in declaration of managed directories and paths for use by shell scripts, reorder and compact the code * get rid of all references to 'otherdir' on snapshots; it's no longer used Bug: T182540 Change-Id: Iabfd52355aced16f5f4693b7c53be965e72652d2 --- M modules/profile/manifests/dumps/generation/worker/common.pp M modules/snapshot/files/cron/create-media-per-project-lists.sh M modules/snapshot/files/cron/dump-global-blocks.sh M modules/snapshot/files/cron/dumpcategoriesrdf.sh M modules/snapshot/files/cron/dumpcirrussearch.sh M modules/snapshot/files/cron/dumpcontentxlation.sh M modules/snapshot/manifests/cron/categoriesrdf.pp M modules/snapshot/manifests/cron/cirrussearch.pp M modules/snapshot/manifests/cron/dump_global_blocks.pp M modules/snapshot/manifests/cron/pagetitles.pp M modules/snapshot/manifests/dumps.pp M modules/snapshot/manifests/dumps/configs.pp M modules/snapshot/manifests/dumps/cron.pp M modules/snapshot/manifests/dumps/dirs.pp M modules/snapshot/templates/set_dump_dirs.sh.erb 15 files changed, 32 insertions(+), 74 deletions(-) git pull ssh://gerrit.wikimedia.org:29418/operations/puppet refs/changes/31/396931/1 diff --git a/modules/profile/manifests/dumps/generation/worker/common.pp b/modules/profile/manifests/dumps/generation/worker/common.pp index 1ecf6fb..5c319c5 100644 --- a/modules/profile/manifests/dumps/generation/worker/common.pp +++ b/modules/profile/manifests/dumps/generation/worker/common.pp @@ -1,11 +1,11 @@ -class profile::dumps::generation::worker::common { +class profile::dumps::generation::worker::common( +) { # mw packages and dependencies require 
::profile::mediawiki::scap_proxy require ::profile::mediawiki::common require ::profile::mediawiki::nutcracker $xmldumpsmount = '/mnt/dumpsdata' - $miscdumpsmount = '/mnt/data' class { '::dumpsuser': } @@ -13,21 +13,14 @@ mountpoint => $xmldumpsmount, server => 'dumpsdata1001.eqiad.wmnet', } - snapshot::dumps::nfsmount { 'datasetmount': - mountpoint => $miscdumpsmount, - server => 'dataset1001.wikimedia.org', - } - # dataset server config files, # stages files, dblists, html templates class { '::snapshot::dumps::dirs': user => 'dumpsgen', xmldumpsmount => $xmldumpsmount, - miscdumpsmount => $miscdumpsmount, } class { '::snapshot::dumps': xmldumpsmount => $xmldumpsmount, - miscdumpsmount => $miscdumpsmount, } # scap3 deployment of dump scripts diff --git a/modules/snapshot/files/cron/create-media-per-project-lists.sh b/modules/snapshot/files/cron/create-media-per-project-lists.sh index b51512b..6c5abb6 100755 --- a/modules/snapshot/files/cron/create-media-per-project-lists.sh +++ b/modules/snapshot/files/cron/create-media-per-project-lists.sh @@ -9,7 +9,7 @@ DATE=`/bin/date '+%Y%m%d'` outputdir="${cronsdir}/imageinfo/$DATE" -configfile="${confsdir}/wikidump.conf:media" +configfile="${confsdir}/wikidump.conf.dumps:media" errors=0 cd "$repodir" diff --git a/modules/snapshot/files/cron/dump-global-blocks.sh b/modules/snapshot/files/cron/dump-global-blocks.sh index 90f80ea..4f5416a 100644 --- a/modules/snapshot/files/cron/dump-global-blocks.sh +++ b/modules/snapshot/files/cron/dump-global-blocks.sh @@ -76,12 +76,12 @@ echo "Usage: $0 [--config <pathtofile>] [--dryrun]" >& 2 echo >& 2 echo " --config path to configuration file for dump generation" >& 2 - echo " (default value: ${confsdir}/wikidump.conf" >& 2 + echo " (default value: ${confsdir}/wikidump.conf.dumps" >& 2 echo " --dryrun don't run dump, show what would have been done" >& 2 exit 1 } -configfile="${confsdir}/wikidump.conf" +configfile="${confsdir}/wikidump.conf.dumps" dryrun="false" while [ $# -gt 0 ]; do 
diff --git a/modules/snapshot/files/cron/dumpcategoriesrdf.sh b/modules/snapshot/files/cron/dumpcategoriesrdf.sh index abb175e..d55a692 100755 --- a/modules/snapshot/files/cron/dumpcategoriesrdf.sh +++ b/modules/snapshot/files/cron/dumpcategoriesrdf.sh @@ -13,13 +13,13 @@ echo "Usage: $0 --list wikis.dblist [--config <pathtofile>] [--dryrun]" echo echo " --config path to configuration file for dump generation" - echo " (default value: ${confsdir}/wikidump.conf" + echo " (default value: ${confsdir}/wikidump.conf.dumps" echo " --list file containing list of the wikis to dump" echo " --dryrun don't run dump, show what would have been done" exit 1 } -configFile="${confsdir}/wikidump.conf" +configFile="${confsdir}/wikidump.conf.dumps" dryrun="false" dumpFormat="ttl" dbList="categories-rdf" diff --git a/modules/snapshot/files/cron/dumpcirrussearch.sh b/modules/snapshot/files/cron/dumpcirrussearch.sh index 61c2cce0..9a7eeb6 100644 --- a/modules/snapshot/files/cron/dumpcirrussearch.sh +++ b/modules/snapshot/files/cron/dumpcirrussearch.sh @@ -13,12 +13,12 @@ echo "Usage: $0 [--config <pathtofile>] [--dryrun]" echo echo " --config path to configuration file for dump generation" - echo " (default value: ${confsdir}/wikidump.conf" + echo " (default value: ${confsdir}/wikidump.conf.dumps" echo " --dryrun don't run dump, show what would have been done" exit 1 } -configFile="${confsdir}/wikidump.conf" +configFile="${confsdir}/wikidump.conf.dumps" dryrun="false" while [ $# -gt 0 ]; do diff --git a/modules/snapshot/files/cron/dumpcontentxlation.sh b/modules/snapshot/files/cron/dumpcontentxlation.sh index b40a37b..c580a7e 100644 --- a/modules/snapshot/files/cron/dumpcontentxlation.sh +++ b/modules/snapshot/files/cron/dumpcontentxlation.sh @@ -26,7 +26,7 @@ echo "Usage: $0 [--config <pathtofile>] [--dryrun]" echo echo " --config path to configuration file for dump generation" - echo " (default value: ${confsdir}/wikidump.conf" + echo " (default value: ${confsdir}/wikidump.conf.dumps" 
echo " --dryrun display dump command instead of running it" exit 1 } @@ -35,7 +35,7 @@ # MAIN ##################### -configfile="${confsdir}/wikidump.conf" +configfile="${confsdir}/wikidump.conf.dumps" dryrun="false" ##################### diff --git a/modules/snapshot/manifests/cron/categoriesrdf.pp b/modules/snapshot/manifests/cron/categoriesrdf.pp index 8312683..6d21ac1 100644 --- a/modules/snapshot/manifests/cron/categoriesrdf.pp +++ b/modules/snapshot/manifests/cron/categoriesrdf.pp @@ -25,7 +25,7 @@ cron { 'categoriesrdf-dump': ensure => 'present', - command => "${scriptpath} --config ${confsdir}/wikidump.conf --list ${apachedir}/dblists/categories-rdf.dblist", + command => "${scriptpath} --config ${confsdir}/wikidump.conf.dumps --list ${apachedir}/dblists/categories-rdf.dblist", environment => 'MAILTO=ops-du...@wikimedia.org', user => $user, minute => '0', diff --git a/modules/snapshot/manifests/cron/cirrussearch.pp b/modules/snapshot/manifests/cron/cirrussearch.pp index 1babe11..ec17dd5 100644 --- a/modules/snapshot/manifests/cron/cirrussearch.pp +++ b/modules/snapshot/manifests/cron/cirrussearch.pp @@ -19,7 +19,7 @@ cron { 'cirrussearch-dump': ensure => 'present', - command => "${scriptpath} --config ${confsdir}/wikidump.conf", + command => "${scriptpath} --config ${confsdir}/wikidump.conf.dumps", environment => 'MAILTO=ops-du...@wikimedia.org', user => $user, minute => '15', diff --git a/modules/snapshot/manifests/cron/dump_global_blocks.pp b/modules/snapshot/manifests/cron/dump_global_blocks.pp index 25b4e7f..97e6dd2 100644 --- a/modules/snapshot/manifests/cron/dump_global_blocks.pp +++ b/modules/snapshot/manifests/cron/dump_global_blocks.pp @@ -12,7 +12,7 @@ cron { 'global_blocks_dump': ensure => 'present', - command => "/usr/local/bin/dump-global-blocks.sh --config ${confsdir}/wikidump.conf", + command => "/usr/local/bin/dump-global-blocks.sh --config ${confsdir}/wikidump.conf.dumps", environment => 'MAILTO=ops-du...@wikimedia.org', user => $user, 
minute => '15', diff --git a/modules/snapshot/manifests/cron/pagetitles.pp b/modules/snapshot/manifests/cron/pagetitles.pp index 3574143..0ddb782 100644 --- a/modules/snapshot/manifests/cron/pagetitles.pp +++ b/modules/snapshot/manifests/cron/pagetitles.pp @@ -9,7 +9,7 @@ ensure => 'present', environment => 'MAILTO=ops-du...@wikimedia.org', user => $user, - command => "cd ${repodir}; python onallwikis.py --configfile ${confsdir}/wikidump.conf:monitor --filenameformat '{w}-{d}-all-titles-in-ns-0.gz' --outdir '${cronsdir}/pagetitles/{d}' --query \"'select page_title from page where page_namespace=0;'\"", + command => "cd ${repodir}; python onallwikis.py --configfile ${confsdir}/wikidump.conf.dumps:monitor --filenameformat '{w}-{d}-all-titles-in-ns-0.gz' --outdir '${cronsdir}/pagetitles/{d}' --query \"'select page_title from page where page_namespace=0;'\"", minute => '10', hour => '8', } @@ -18,7 +18,7 @@ ensure => 'present', environment => 'MAILTO=ops-du...@wikimedia.org', user => $user, - command => "cd ${repodir}; python onallwikis.py --configfile ${confsdir}/wikidump.conf:monitor --filenameformat '{w}-{d}-all-media-titles.gz' --outdir '${cronsdir}/mediatitles/{d}' --query \"'select page_title from page where page_namespace=6;'\"", + command => "cd ${repodir}; python onallwikis.py --configfile ${confsdir}/wikidump.conf.dumps:monitor --filenameformat '{w}-{d}-all-media-titles.gz' --outdir '${cronsdir}/mediatitles/{d}' --query \"'select page_title from page where page_namespace=6;'\"", minute => '50', hour => '8', } diff --git a/modules/snapshot/manifests/dumps.pp b/modules/snapshot/manifests/dumps.pp index e2248cc..5c678e6 100644 --- a/modules/snapshot/manifests/dumps.pp +++ b/modules/snapshot/manifests/dumps.pp @@ -1,11 +1,9 @@ class snapshot::dumps( $xmldumpsmount = undef, - $miscdumpsmount = undef, ) { include ::snapshot::dumps::packages class { '::snapshot::dumps::configs': xmldumpsmount => $xmldumpsmount, - miscdumpsmount => $miscdumpsmount, } include 
::snapshot::dumps::dblists include ::snapshot::dumps::templates diff --git a/modules/snapshot/manifests/dumps/configs.pp b/modules/snapshot/manifests/dumps/configs.pp index 1fb7ed4..e77eeaa 100644 --- a/modules/snapshot/manifests/dumps/configs.pp +++ b/modules/snapshot/manifests/dumps/configs.pp @@ -1,6 +1,5 @@ class snapshot::dumps::configs( $xmldumpsmount = undef, - $miscdumpsmount = undef, ) { $dblistsdir = $snapshot::dumps::dirs::dblistsdir $apachedir = $snapshot::dumps::dirs::apachedir @@ -134,14 +133,6 @@ }, } - # for jobs running on dataset host - snapshot::dumps::wikiconf { 'wikidump.conf': - configtype => 'allwikis', - config => $config, - publicdir => "${miscdumpsmount}/xmldatadumps/public", - privatedir => "${miscdumpsmount}/xmldatadumps/private", - tempdir => "${miscdumpsmount}/xmldatadumps/temp", - } # for xml/sql dumps running on dumpsdata host snapshot::dumps::wikiconf { 'wikidump.conf.dumps': configtype => 'allwikis', diff --git a/modules/snapshot/manifests/dumps/cron.pp b/modules/snapshot/manifests/dumps/cron.pp index 3adb2b8..dee3c72 100644 --- a/modules/snapshot/manifests/dumps/cron.pp +++ b/modules/snapshot/manifests/dumps/cron.pp @@ -28,7 +28,7 @@ } # fixme there is an implicit dependency on - # wikidump.conf.* plus some stage files, make explicit + # wikidump.conf.dumps plus some stage files, make explicit cron { 'fulldumps_rest': ensure => 'present', diff --git a/modules/snapshot/manifests/dumps/dirs.pp b/modules/snapshot/manifests/dumps/dirs.pp index d54bd13..72603bd 100644 --- a/modules/snapshot/manifests/dumps/dirs.pp +++ b/modules/snapshot/manifests/dumps/dirs.pp @@ -1,72 +1,49 @@ class snapshot::dumps::dirs( $user = undef, $xmldumpsmount = undef, - $miscdumpsmount = undef, ) { + # need to create and manage these, and have them + # available for a shell script that sets vars with + # their values for inclusion by other scripts $dumpsdir = '/etc/dumps' file { $dumpsdir: ensure => 'directory', - path => $dumpsdir, mode => '0755', owner => 
'root', group => 'root', } - $miscdumpsdir = "${miscdumpsmount}/xmldatadumps" - $xmldumpsdir = "${xmldumpsmount}/xmldatadumps" - $cronsdir = "${xmldumpsmount}/otherdumps" - - $apachedir = '/srv/mediawiki' $confsdir = "${dumpsdir}/confs" - - file { $confsdir: - ensure => 'directory', - path => $confsdir, - mode => '0755', - owner => 'root', - group => 'root', - } - $dblistsdir = "${dumpsdir}/dblists" - file { $dblistsdir: - ensure => 'directory', - path => $dblistsdir, - mode => '0755', - owner => 'root', - group => 'root', - } - $stagesdir = "${dumpsdir}/stages" - file { $stagesdir: + $templsdir = "${dumpsdir}/templs" + file { [ $confsdir, $dblistsdir, $stagesdir, + $templsdir ]: ensure => 'directory', - path => $stagesdir, mode => '0755', owner => 'root', group => 'root', } + # dir will be written in by the user $cachedir = "${dumpsdir}/cache" file { $cachedir: ensure => 'directory', - path => $cachedir, mode => '0755', owner => $user, group => 'root', } - $templsdir = "${dumpsdir}/templs" - file { $templsdir: - ensure => 'directory', - path => $templsdir, - mode => '0755', - owner => 'root', - group => 'root', - } - - $otherdir = "${miscdumpsdir}/public/other" - + # need these only for the shell script that sets + # vars with their values for other scripts + $xmldumpsdir = "${xmldumpsmount}/xmldatadumps" + $cronsdir = "${xmldumpsmount}/otherdumps" + $apachedir = '/srv/mediawiki' $repodir = '/srv/deployment/dumps/dumps/xmldumps-backup' + # here's that script; it gets sourced by + # various cron jobs so they know where to + # write output, where to find dump scripts, etc. 
file { '/usr/local/etc/set_dump_dirs.sh': ensure => 'present', path => '/usr/local/etc/set_dump_dirs.sh', diff --git a/modules/snapshot/templates/set_dump_dirs.sh.erb b/modules/snapshot/templates/set_dump_dirs.sh.erb index 6313c23..5a846da 100644 --- a/modules/snapshot/templates/set_dump_dirs.sh.erb +++ b/modules/snapshot/templates/set_dump_dirs.sh.erb @@ -5,7 +5,6 @@ repodir="<%= scope.lookupvar('snapshot::dumps::dirs::repodir') -%>" xmldumpsdir="<%= scope.lookupvar('snapshot::dumps::dirs::xmldumpsdir') -%>" miscdumpsdir="<%= scope.lookupvar('snapshot::dumps::dirs::miscdumpsdir') -%>" -otherdir="<%= scope.lookupvar('snapshot::dumps::dirs::otherdir') -%>" cronsdir="<%= scope.lookupvar('snapshot::dumps::dirs::cronsdir') -%>" dumpsdir="<%= scope.lookupvar('snapshot::dumps::dirs::dumpsdir') -%>" dblistsdir="<%= scope.lookupvar('snapshot::dumps::dirs::dblistsdir') -%>" -- To view, visit https://gerrit.wikimedia.org/r/396931 To unsubscribe, visit https://gerrit.wikimedia.org/r/settings Gerrit-MessageType: newchange Gerrit-Change-Id: Iabfd52355aced16f5f4693b7c53be965e72652d2 Gerrit-PatchSet: 1 Gerrit-Project: operations/puppet Gerrit-Branch: production Gerrit-Owner: ArielGlenn <ar...@wikimedia.org> _______________________________________________ MediaWiki-commits mailing list MediaWiki-commits@lists.wikimedia.org https://lists.wikimedia.org/mailman/listinfo/mediawiki-commits