ArielGlenn has uploaded a new change for review.
https://gerrit.wikimedia.org/r/236487
Change subject: dumps: big wikis do abstracts in 4 chunks, no need for page ranges
......................................................................
dumps: big wikis do abstracts in 4 chunks, no need for page ranges
Change-Id: Ibb5e14fb7075636acddeccbdce059794ac3fabe5
---
M modules/snapshot/manifests/dumps/configs.pp
M modules/snapshot/templates/wikidump.conf.erb
2 files changed, 12 insertions(+), 0 deletions(-)
git pull ssh://gerrit.wikimedia.org:29418/operations/puppet refs/changes/87/236487/1
diff --git a/modules/snapshot/manifests/dumps/configs.pp b/modules/snapshot/manifests/dumps/configs.pp
index fc23d2c..5b9e7d0 100644
--- a/modules/snapshot/manifests/dumps/configs.pp
+++ b/modules/snapshot/manifests/dumps/configs.pp
@@ -22,46 +22,57 @@
ruwiki => {
pagesPerChunkHistory => '256900,895900,1280900,2000000',
pagesPerChunkAbstract => '1200000',
+ chunksForAbstract => '4',
},
eswiki => {
pagesPerChunkHistory => '190300,671500,1627200,2000000',
pagesPerChunkAbstract => '1500000',
+ chunksForAbstract => '4',
},
dewiki => {
pagesPerChunkHistory => '33640,1446760,2569200,3000000',
pagesPerChunkAbstract => '2000000',
+ chunksForAbstract => '4',
},
ptwiki => {
pagesPerChunkHistory => '137500,668700,1208900,2000000',
pagesPerChunkAbstract => '1000000',
+ chunksForAbstract => '4',
},
plwiki => {
pagesPerChunkHistory => '208000,422000,818900,2000000',
pagesPerChunkAbstract => '800000',
+ chunksForAbstract => '4',
},
nlwiki => {
pagesPerChunkHistory => '200800,490800,934600,2000000',
pagesPerChunkAbstract => '1000000',
+ chunksForAbstract => '4',
},
frwiki => {
pagesPerChunkHistory => '348700,965200,2331100,3000000',
pagesPerChunkAbstract => '1900000',
+ chunksForAbstract => '4',
},
itwiki => {
pagesPerChunkHistory => '335400,941600,1180900,2000000',
pagesPerChunkAbstract => '1200000',
+ chunksForAbstract => '4',
},
jawiki => {
pagesPerChunkHistory => '149600,801600,408900,2000000',
pagesPerChunkAbstract => '800000',
+ chunksForAbstract => '4',
},
commonswiki => {
pagesPerChunkHistory => '6440000,8960000,11260000,20000000',
pagesPerChunkAbstract => '11000000',
+ chunksForAbstract => '4',
},
wikidatawiki => {
pagesPerChunkHistory => '2300000,4500000,8600000,10000000',
pagesPerChunkAbstract => '5800000',
+ chunksForAbstract => '4',
},
},
},
diff --git a/modules/snapshot/templates/wikidump.conf.erb b/modules/snapshot/templates/wikidump.conf.erb
index 3c4f280..2000bcc 100644
--- a/modules/snapshot/templates/wikidump.conf.erb
+++ b/modules/snapshot/templates/wikidump.conf.erb
@@ -67,6 +67,7 @@
[<%= [w] %>]
pagesPerChunkHistory=<%= @config[@configtype]['wikis'][w]['pagesPerChunkHistory'] %>
pagesPerChunkAbstract=<%= @config[@configtype]['wikis'][w]['pagesPerChunkAbstract'] %>
+chunksForAbstract=<%= @config[@configtype]['wikis'][w]['chunksForAbstract'] %>
<% end -%>
<% end -%>
--
To view, visit https://gerrit.wikimedia.org/r/236487
To unsubscribe, visit https://gerrit.wikimedia.org/r/settings
Gerrit-MessageType: newchange
Gerrit-Change-Id: Ibb5e14fb7075636acddeccbdce059794ac3fabe5
Gerrit-PatchSet: 1
Gerrit-Project: operations/puppet
Gerrit-Branch: production
Gerrit-Owner: ArielGlenn <[email protected]>
_______________________________________________
MediaWiki-commits mailing list
[email protected]
https://lists.wikimedia.org/mailman/listinfo/mediawiki-commits