1
0
mirror of https://github.com/gnosygnu/xowa.git synced 2026-03-02 03:49:30 +00:00

v4.5.7.1706

This commit is contained in:
gnosygnu
2017-06-25 21:14:55 -04:00
parent 37d5550c4f
commit c659d5fd91
166 changed files with 3492 additions and 2147 deletions

View File

@@ -18,7 +18,7 @@
<div id="mw-content-text" lang="en" dir="ltr" class="mw-content-ltr">
<div id="toc" class="toc">
<div id="toctitle">
<div id="toctitle" class="toctitle">
<h2>
Contents
</h2>

View File

@@ -35,7 +35,7 @@
XOWA can import a wiki using a plain text file and a command-line.
</p>
<div id="toc" class="toc">
<div id="toctitle">
<div id="toctitle" class="toctitle">
<h2>
Contents
</h2>

View File

@@ -58,7 +58,7 @@
<br>
</p>
<div id="toc" class="toc">
<div id="toctitle">
<div id="toctitle" class="toctitle">
<h2>
Contents
</h2>
@@ -441,8 +441,8 @@ app.bldr.cmds {
add ('simple.wikipedia.org' , 'wiki.mass_parse.exec') {
cfg {
num_wkrs = 8; load_all_templates = 'y'; load_all_imglinks = 'y'; indexer_enabled = 'y';
cleanup_interval = 50; hzip_enabled = 'y'; hdiff_enabled ='y'; manual_now = '2017-04-01 00:00:00'
num_wkrs = 8; load_all_templates = 'y'; cleanup_interval = 50; hzip_enabled = 'y'; hdiff_enabled ='y'; manual_now = '2016-08-01 01:02:03';
load_all_imglinks = 'y';
// uncomment the following 3 lines if using the build script as a "worker" helping a "server"
// num_pages_in_pool = 32000;
@@ -521,8 +521,7 @@ app.bldr.cmds {
add ('www.wikidata.org' , 'wiki.page_props');
add ('www.wikidata.org' , 'wiki.categorylinks');
add ('www.wikidata.org' , 'wiki.redirect') {commit_interval = 1000; progress_interval = 100; cleanup_interval = 100;}
add ('www.wikidata.org' , 'util.cleanup') {delete_tmp = 'y'; delete_by_match('*.xml|*.sql|*.bz2|*.gz');}
// add ('www.wikidata.org' , 'util.cleanup') {delete_tmp = 'y'; delete_by_match('*.xml|*.sql|*.bz2|*.gz');}
add ('commons.wikimedia.org' , 'util.cleanup') {delete_all = 'y';}
add ('commons.wikimedia.org' , 'util.download') {dump_type = 'pages-articles';}
add ('commons.wikimedia.org' , 'util.download') {dump_type = 'image';}
@@ -536,8 +535,7 @@ app.bldr.cmds {
add ('commons.wikimedia.org' , 'file.page_regy') {build_commons = 'y'}
add ('commons.wikimedia.org' , 'wiki.page_dump.make');
add ('commons.wikimedia.org' , 'wiki.redirect') {commit_interval = 1000; progress_interval = 100; cleanup_interval = 100;}
add ('commons.wikimedia.org' , 'util.cleanup') {delete_tmp = 'y'; delete_by_match('*.xml|*.sql|*.bz2|*.gz');}
// add ('commons.wikimedia.org' , 'util.cleanup') {delete_tmp = 'y'; delete_by_match('*.xml|*.sql|*.bz2|*.gz');}
add ('en.wikipedia.org' , 'util.download') {dump_type = 'pages-articles';}
add ('en.wikipedia.org' , 'util.download') {dump_type = 'pagelinks';}
add ('en.wikipedia.org' , 'util.download') {dump_type = 'categorylinks';}
@@ -545,7 +543,6 @@ app.bldr.cmds {
add ('en.wikipedia.org' , 'util.download') {dump_type = 'image';}
add ('en.wikipedia.org' , 'util.download') {dump_type = 'imagelinks';}
*/
/*
// en.wikipedia.org
add ('en.wikipedia.org' , 'text.init');
@@ -571,25 +568,28 @@ app.bldr.cmds {
}
}
}
add ('en.wikipedia.org' , 'search.word__link_count');
add ('en.wikipedia.org' , 'search.word__link_count')
add ('en.wikipedia.org' , 'wiki.page_props');
add ('en.wikipedia.org' , 'wiki.categorylinks');
add ('en.wikipedia.org' , 'file.page_regy') {build_commons = 'n'}
// add ('en.wikipedia.org' , 'wiki.mass_parse.resume');
add ('en.wikipedia.org' , 'wiki.mass_parse.init') {cfg {ns_ids = '0|4|100|14|8';}}
add ('en.wikipedia.org' , 'wiki.mass_parse.exec') {cfg {
num_wkrs = 8; load_all_templates = 'y'; load_all_imglinks = 'y'; indexer_enabled = 'y';
cleanup_interval = 50; hzip_enabled = 'y'; hdiff_enabled ='y'; manual_now = '2017-04-01 00:00:00'
}
}
*/
/*
add ('en.wikipedia.org' , 'file.page_regy') {build_commons = 'n'}
add ('en.wikipedia.org' , 'wiki.mass_parse.init') {cfg {ns_ids = '0|4|100|14|8';}}
// add ('en.wikipedia.org' , 'wiki.mass_parse.resume');
add ('en.wikipedia.org' , 'wiki.mass_parse.exec') {cfg {
num_wkrs = 8; load_all_templates = 'y'; load_ifexists_ns = '*'; cleanup_interval = 25; hzip_enabled = 'y'; hdiff_enabled ='y'; manual_now = '2017-01-01 01:02:03';}
// num_wkrs = 1; load_all_templates = 'n'; load_all_imglnks = 'n'; cleanup_interval = 50; hzip_enabled = 'y'; hdiff_enabled ='y'; manual_now = '2016-07-28 01:02:03';}
}
add ('en.wikipedia.org' , 'wiki.mass_parse.make');
// SELECT * FROM image ORDER BY img_timestamp DESC LIMIT 20; // 20170306194400
// SELECT * FROM page WHERE page_namespace = 6 ORDER BY page_touched DESC LIMIT 20; // 20170302024207
// SELECT * FROM xowa_cfg WHERE cfg_key = 'props.modified_latest';
*/
/*
add ('en.wikipedia.org' , 'file.lnki_temp') {
commit_interval = 10000; progress_interval = 50; cleanup_interval = 50; select_size = 25;
ns_ids = '0|4|14|100|12|8|6|10|828|108|118|446|710|2300|2302|2600';
hdump_bldr {enabled = 'y'; hzip_enabled = 'y'; hzip_diff = 'y';}
}
*/
/*
add ('commons.wikimedia.org' , 'file.page_regy') {build_commons = 'y'}
add ('en.wikipedia.org' , 'file.page_regy') {build_commons = 'n';}
add ('en.wikipedia.org' , 'file.lnki_regy');
@@ -597,15 +597,9 @@ app.bldr.cmds {
add ('en.wikipedia.org' , 'file.orig_regy');
add ('en.wikipedia.org' , 'file.xfer_temp.thumb');
// SELECT * FROM orig_regy WHERE lnki_ttl = 'BSicon_CONTr.svg';
// SELECT * FROM page_regy WHERE src_ttl = 'BSicon_CONTr.svg';
// SELECT Count(*) FROM xfer_regy WHERE xfer_status = 0;
// SELECT * FROM xfer_regy WHERE xfer_status = 0 AND lnki_page_id = 372692; --en.w:Featured_picture_candidates
add ('en.wikipedia.org' , 'file.xfer_regy');
add ('en.wikipedia.org' , 'file.xfer_regy_update');
*/
/*
add ('en.wikipedia.org' , 'file.fsdb_make') {
commit_interval = 1000; progress_interval = 200; select_interval = 10000;
@@ -636,10 +630,7 @@ app.bldr.run;
2016-10-12: explicitly set web_access_enabled to y
</li>
<li>
2017-02-02: added multi-threaded version and new options
</li>
<li>
2017-05-12: added full-text search
2017-02-02: updated script for multi-threaded version and new options
</li>
</ul>

View File

@@ -32,7 +32,7 @@
<div id="mw-content-text" lang="en" dir="ltr" class="mw-content-ltr">
<div id="toc" class="toc">
<div id="toctitle">
<div id="toctitle" class="toctitle">
<h2>
Contents
</h2>

View File

@@ -58,7 +58,7 @@
<br>
</p>
<div id="toc" class="toc">
<div id="toctitle">
<div id="toctitle" class="toctitle">
<h2>
Contents
</h2>
@@ -441,8 +441,8 @@ app.bldr.cmds {
add ('simple.wikipedia.org' , 'wiki.mass_parse.exec') {
cfg {
num_wkrs = 8; load_all_templates = 'y'; load_all_imglinks = 'y'; indexer_enabled = 'y';
cleanup_interval = 50; hzip_enabled = 'y'; hdiff_enabled ='y'; manual_now = '2017-04-01 00:00:00'
num_wkrs = 8; load_all_templates = 'y'; cleanup_interval = 50; hzip_enabled = 'y'; hdiff_enabled ='y'; manual_now = '2016-08-01 01:02:03';
load_all_imglinks = 'y';
// uncomment the following 3 lines if using the build script as a "worker" helping a "server"
// num_pages_in_pool = 32000;
@@ -521,8 +521,7 @@ app.bldr.cmds {
add ('www.wikidata.org' , 'wiki.page_props');
add ('www.wikidata.org' , 'wiki.categorylinks');
add ('www.wikidata.org' , 'wiki.redirect') {commit_interval = 1000; progress_interval = 100; cleanup_interval = 100;}
add ('www.wikidata.org' , 'util.cleanup') {delete_tmp = 'y'; delete_by_match('*.xml|*.sql|*.bz2|*.gz');}
// add ('www.wikidata.org' , 'util.cleanup') {delete_tmp = 'y'; delete_by_match('*.xml|*.sql|*.bz2|*.gz');}
add ('commons.wikimedia.org' , 'util.cleanup') {delete_all = 'y';}
add ('commons.wikimedia.org' , 'util.download') {dump_type = 'pages-articles';}
add ('commons.wikimedia.org' , 'util.download') {dump_type = 'image';}
@@ -536,8 +535,7 @@ app.bldr.cmds {
add ('commons.wikimedia.org' , 'file.page_regy') {build_commons = 'y'}
add ('commons.wikimedia.org' , 'wiki.page_dump.make');
add ('commons.wikimedia.org' , 'wiki.redirect') {commit_interval = 1000; progress_interval = 100; cleanup_interval = 100;}
add ('commons.wikimedia.org' , 'util.cleanup') {delete_tmp = 'y'; delete_by_match('*.xml|*.sql|*.bz2|*.gz');}
// add ('commons.wikimedia.org' , 'util.cleanup') {delete_tmp = 'y'; delete_by_match('*.xml|*.sql|*.bz2|*.gz');}
add ('en.wikipedia.org' , 'util.download') {dump_type = 'pages-articles';}
add ('en.wikipedia.org' , 'util.download') {dump_type = 'pagelinks';}
add ('en.wikipedia.org' , 'util.download') {dump_type = 'categorylinks';}
@@ -545,7 +543,6 @@ app.bldr.cmds {
add ('en.wikipedia.org' , 'util.download') {dump_type = 'image';}
add ('en.wikipedia.org' , 'util.download') {dump_type = 'imagelinks';}
*/
/*
// en.wikipedia.org
add ('en.wikipedia.org' , 'text.init');
@@ -571,25 +568,28 @@ app.bldr.cmds {
}
}
}
add ('en.wikipedia.org' , 'search.word__link_count');
add ('en.wikipedia.org' , 'search.word__link_count')
add ('en.wikipedia.org' , 'wiki.page_props');
add ('en.wikipedia.org' , 'wiki.categorylinks');
add ('en.wikipedia.org' , 'file.page_regy') {build_commons = 'n'}
// add ('en.wikipedia.org' , 'wiki.mass_parse.resume');
add ('en.wikipedia.org' , 'wiki.mass_parse.init') {cfg {ns_ids = '0|4|100|14|8';}}
add ('en.wikipedia.org' , 'wiki.mass_parse.exec') {cfg {
num_wkrs = 8; load_all_templates = 'y'; load_all_imglinks = 'y'; indexer_enabled = 'y';
cleanup_interval = 50; hzip_enabled = 'y'; hdiff_enabled ='y'; manual_now = '2017-04-01 00:00:00'
}
}
*/
/*
add ('en.wikipedia.org' , 'file.page_regy') {build_commons = 'n'}
add ('en.wikipedia.org' , 'wiki.mass_parse.init') {cfg {ns_ids = '0|4|100|14|8';}}
// add ('en.wikipedia.org' , 'wiki.mass_parse.resume');
add ('en.wikipedia.org' , 'wiki.mass_parse.exec') {cfg {
num_wkrs = 8; load_all_templates = 'y'; load_ifexists_ns = '*'; cleanup_interval = 25; hzip_enabled = 'y'; hdiff_enabled ='y'; manual_now = '2017-01-01 01:02:03';}
// num_wkrs = 1; load_all_templates = 'n'; load_all_imglnks = 'n'; cleanup_interval = 50; hzip_enabled = 'y'; hdiff_enabled ='y'; manual_now = '2016-07-28 01:02:03';}
}
add ('en.wikipedia.org' , 'wiki.mass_parse.make');
// SELECT * FROM image ORDER BY img_timestamp DESC LIMIT 20; // 20170306194400
// SELECT * FROM page WHERE page_namespace = 6 ORDER BY page_touched DESC LIMIT 20; // 20170302024207
// SELECT * FROM xowa_cfg WHERE cfg_key = 'props.modified_latest';
*/
/*
add ('en.wikipedia.org' , 'file.lnki_temp') {
commit_interval = 10000; progress_interval = 50; cleanup_interval = 50; select_size = 25;
ns_ids = '0|4|14|100|12|8|6|10|828|108|118|446|710|2300|2302|2600';
hdump_bldr {enabled = 'y'; hzip_enabled = 'y'; hzip_diff = 'y';}
}
*/
/*
add ('commons.wikimedia.org' , 'file.page_regy') {build_commons = 'y'}
add ('en.wikipedia.org' , 'file.page_regy') {build_commons = 'n';}
add ('en.wikipedia.org' , 'file.lnki_regy');
@@ -597,15 +597,9 @@ app.bldr.cmds {
add ('en.wikipedia.org' , 'file.orig_regy');
add ('en.wikipedia.org' , 'file.xfer_temp.thumb');
// SELECT * FROM orig_regy WHERE lnki_ttl = 'BSicon_CONTr.svg';
// SELECT * FROM page_regy WHERE src_ttl = 'BSicon_CONTr.svg';
// SELECT Count(*) FROM xfer_regy WHERE xfer_status = 0;
// SELECT * FROM xfer_regy WHERE xfer_status = 0 AND lnki_page_id = 372692; --en.w:Featured_picture_candidates
add ('en.wikipedia.org' , 'file.xfer_regy');
add ('en.wikipedia.org' , 'file.xfer_regy_update');
*/
/*
add ('en.wikipedia.org' , 'file.fsdb_make') {
commit_interval = 1000; progress_interval = 200; select_interval = 10000;
@@ -636,10 +630,7 @@ app.bldr.run;
2016-10-12: explicitly set web_access_enabled to y
</li>
<li>
2017-02-02: added multi-threaded version and new options
</li>
<li>
2017-05-12: added full-text search
2017-02-02: updated script for multi-threaded version and new options
</li>
</ul>

View File

@@ -32,7 +32,7 @@
<div id="mw-content-text" lang="en" dir="ltr" class="mw-content-ltr">
<div id="toc" class="toc">
<div id="toctitle">
<div id="toctitle" class="toctitle">
<h2>
Contents
</h2>

View File

@@ -18,7 +18,7 @@
<div id="mw-content-text" lang="en" dir="ltr" class="mw-content-ltr">
<div id="toc" class="toc">
<div id="toctitle">
<div id="toctitle" class="toctitle">
<h2>
Contents
</h2>

View File

@@ -21,7 +21,7 @@
The Wikimedia data dump files are released in compressed forms: <a href="http://en.wikipedia.org/bzip2" rel="nofollow" class="external text">bzip2</a> or <a href="http://en.wikipedia.org/gzip" rel="nofollow" class="external text">gzip</a>. Prior to v0.5.2, XOWA required that the files be uncompressed in order to read them. v0.5.2 allows the user the option to either read directly from the compressed or uncompressed file.
</p>
<div id="toc" class="toc">
<div id="toctitle">
<div id="toctitle" class="toctitle">
<h2>
Contents
</h2>

View File

@@ -18,7 +18,7 @@
<div id="mw-content-text" lang="en" dir="ltr" class="mw-content-ltr">
<div id="toc" class="toc">
<div id="toctitle">
<div id="toctitle" class="toctitle">
<h2>
Contents
</h2>

View File

@@ -18,7 +18,7 @@
<div id="mw-content-text" lang="en" dir="ltr" class="mw-content-ltr">
<div id="toc" class="toc">
<div id="toctitle">
<div id="toctitle" class="toctitle">
<h2>
Contents
</h2>

View File

@@ -42,7 +42,7 @@
</p>
<ul>
<li>
<code>[ 50 GB; 03 h]</code> Import the Commons wiki with category level 2. See <a href="http://xowa.org/home/wiki/Dashboard/Import/Offline.html" id="xolnki_2" title="Dashboard/Import/Offline" class="xowa-visited">Dashboard/Import/Offline</a>
<code>[ 50 GB; 03 h]</code> Import the Commons wiki with category level 2. See <a href="http://xowa.org/home/wiki/Dashboard/Import/Offline.html" id="xolnki_2" title="Dashboard/Import/Offline">Dashboard/Import/Offline</a>
</li>
<li>
<code>[ 50 GB; 02 h]</code> Download and unzip commonswiki-latest-image.sql.gz

View File

@@ -61,7 +61,7 @@
The file format is controlled by other arguments
</p>
<div id="toc" class="toc">
<div id="toctitle">
<div id="toctitle" class="toctitle">
<h2>
Contents
</h2>

View File

@@ -21,7 +21,7 @@
Certain files are best displayed in dedicated third party applications. For example, a video file cannot be played natively in a HTML browser, but can be played in a media player.
</p>
<div id="toc" class="toc">
<div id="toctitle">
<div id="toctitle" class="toctitle">
<h2>
Contents
</h2>

View File

@@ -36,7 +36,7 @@
For more information about the config, see the section below.
</p>
<div id="toc" class="toc">
<div id="toctitle">
<div id="toctitle" class="toctitle">
<h2>
Contents
</h2>

View File

@@ -46,7 +46,7 @@
</li>
</ul>
<p>
If you do succeed in installing ImageMagick/Inkscape, please help XOWA and detail your experience. See <a href="http://xowa.org/home/wiki/Help/Feedback.html" id="xolnki_3" title="Help/Feedback" class="xowa-visited">Help/Feedback</a>.
If you do succeed in installing ImageMagick/Inkscape, please help XOWA and detail your experience. See <a href="http://xowa.org/home/wiki/Help/Feedback.html" id="xolnki_3" title="Help/Feedback">Help/Feedback</a>.
</p>
</div>

View File

@@ -21,7 +21,7 @@
If you run into issues with this install, then you may will need to install the components manually. The sections below provide more detail.
</p>
<div id="toc" class="toc">
<div id="toctitle">
<div id="toctitle" class="toctitle">
<h2>
Contents
</h2>

View File

@@ -18,7 +18,7 @@
<div id="mw-content-text" lang="en" dir="ltr" class="mw-content-ltr">
<div id="toc" class="toc">
<div id="toctitle">
<div id="toctitle" class="toctitle">
<h2>
Contents
</h2>

View File

@@ -21,7 +21,7 @@
SWT is a core GUI library in XOWA.
</p>
<div id="toc" class="toc">
<div id="toctitle">
<div id="toctitle" class="toctitle">
<h2>
Contents
</h2>

View File

@@ -18,7 +18,7 @@
<div id="mw-content-text" lang="en" dir="ltr" class="mw-content-ltr">
<div id="toc" class="toc">
<div id="toctitle">
<div id="toctitle" class="toctitle">
<h2>
Contents
</h2>