diff options
Diffstat (limited to 'www/wiki/maintenance/mssql/tables.sql')
-rw-r--r-- | www/wiki/maintenance/mssql/tables.sql | 1509 |
1 files changed, 1509 insertions, 0 deletions
diff --git a/www/wiki/maintenance/mssql/tables.sql b/www/wiki/maintenance/mssql/tables.sql new file mode 100644 index 00000000..67746f04 --- /dev/null +++ b/www/wiki/maintenance/mssql/tables.sql @@ -0,0 +1,1509 @@ +-- Experimental table definitions for Microsoft SQL Server with +-- content-holding fields switched to explicit BINARY charset. +-- ------------------------------------------------------------ + +-- SQL to create the initial tables for the MediaWiki database. +-- This is read and executed by the install script; you should +-- not have to run it by itself unless doing a manual install. + +-- +-- General notes: +-- +-- The comments in this and other files are +-- replaced with the defined table prefix by the installer +-- and updater scripts. If you are installing or running +-- updates manually, you will need to manually insert the +-- table prefix if any when running these scripts. +-- + + +-- +-- The user table contains basic account information, +-- authentication keys, etc. +-- +-- Some multi-wiki sites may share a single central user table +-- between separate wikis using the $wgSharedDB setting. +-- +-- Note that when a external authentication plugin is used, +-- user table entries still need to be created to store +-- preferences and to key tracking information in the other +-- tables. + +-- LINE:53 +CREATE TABLE /*_*/mwuser ( + user_id INT NOT NULL PRIMARY KEY IDENTITY(0,1), + user_name NVARCHAR(255) NOT NULL UNIQUE DEFAULT '', + user_real_name NVARCHAR(255) NOT NULL DEFAULT '', + user_password NVARCHAR(255) NOT NULL DEFAULT '', + user_newpassword NVARCHAR(255) NOT NULL DEFAULT '', + user_newpass_time varchar(14) NULL DEFAULT NULL, + user_email NVARCHAR(255) NOT NULL DEFAULT '', + user_touched varchar(14) NOT NULL DEFAULT '', + user_token NCHAR(32) NOT NULL DEFAULT '', + user_email_authenticated varchar(14) DEFAULT NULL, + user_email_token NCHAR(32) DEFAULT '', + user_email_token_expires varchar(14) DEFAULT NULL, + user_registration varchar(14) DEFAULT NULL, + user_editcount INT NULL DEFAULT NULL, + user_password_expires varchar(14) DEFAULT NULL +); +CREATE UNIQUE INDEX /*i*/user_name ON /*_*/mwuser (user_name); +CREATE INDEX /*i*/user_email_token ON /*_*/mwuser (user_email_token); +CREATE INDEX /*i*/user_email ON /*_*/mwuser (user_email); + +-- Insert a dummy user to represent anons +INSERT INTO /*_*/mwuser (user_name) VALUES ('##Anonymous##'); + +-- +-- The "actor" table associates user names or IP addresses with integers for +-- the benefit of other tables that need to refer to either logged-in or +-- logged-out users. If something can only ever be done by logged-in users, it +-- can refer to the user table directly. +-- +CREATE TABLE /*_*/actor ( + actor_id bigint unsigned NOT NULL CONSTRAINT PK_actor PRIMARY KEY IDENTITY(0,1), + actor_user int unsigned, + actor_name nvarchar(255) NOT NULL +); +CREATE UNIQUE INDEX /*i*/actor_user ON /*_*/actor (actor_user); +CREATE UNIQUE INDEX /*i*/actor_name ON /*_*/actor (actor_name); + +-- Insert a dummy actor to represent no actor +INSERT INTO /*_*/actor (actor_name) VALUES ('##Anonymous##'); + +-- +-- User permissions have been broken out to a separate table; +-- this allows sites with a shared user table to have different +-- permissions assigned to a user in each project. +-- +-- This table replaces the old user_rights field which used a +-- comma-separated nvarchar(max). +CREATE TABLE /*_*/user_groups ( + ug_user INT NOT NULL REFERENCES /*_*/mwuser(user_id) ON DELETE CASCADE, + ug_group NVARCHAR(255) NOT NULL DEFAULT '', + ug_expiry varchar(14) DEFAULT NULL, + PRIMARY KEY(ug_user, ug_group) +); +CREATE INDEX /*i*/ug_group ON /*_*/user_groups(ug_group); +CREATE INDEX /*i*/ug_expiry ON /*_*/user_groups(ug_expiry); + +-- Stores the groups the user has once belonged to. +-- The user may still belong to these groups (check user_groups). +-- Users are not autopromoted to groups from which they were removed. +CREATE TABLE /*_*/user_former_groups ( + ufg_user INT NOT NULL REFERENCES /*_*/mwuser(user_id) ON DELETE CASCADE, + ufg_group nvarchar(255) NOT NULL default '' +); +CREATE UNIQUE INDEX /*i*/ufg_user_group ON /*_*/user_former_groups (ufg_user,ufg_group); + +-- Stores notifications of user talk page changes, for the display +-- of the "you have new messages" box +-- Changed user_id column to user_id to avoid clashing with user_id function +CREATE TABLE /*_*/user_newtalk ( + user_id INT NOT NULL REFERENCES /*_*/mwuser(user_id) ON DELETE CASCADE, + user_ip NVARCHAR(40) NOT NULL DEFAULT '', + user_last_timestamp varchar(14) DEFAULT NULL, +); +CREATE INDEX /*i*/un_user_id ON /*_*/user_newtalk (user_id); +CREATE INDEX /*i*/un_user_ip ON /*_*/user_newtalk (user_ip); + +-- +-- User preferences and other fun stuff +-- replaces old user.user_options nvarchar(max) +-- +CREATE TABLE /*_*/user_properties ( + up_user INT NOT NULL REFERENCES /*_*/mwuser(user_id) ON DELETE CASCADE, + up_property NVARCHAR(255) NOT NULL, + up_value NVARCHAR(MAX), +); +CREATE UNIQUE CLUSTERED INDEX /*i*/user_properties_user_property ON /*_*/user_properties (up_user,up_property); +CREATE INDEX /*i*/user_properties_property ON /*_*/user_properties (up_property); + +-- +-- This table contains a user's bot passwords: passwords that allow access to +-- the account via the API with limited rights. +-- +CREATE TABLE /*_*/bot_passwords ( + bp_user int NOT NULL REFERENCES /*_*/mwuser(user_id) ON DELETE CASCADE, + bp_app_id nvarchar(32) NOT NULL, + bp_password nvarchar(255) NOT NULL, + bp_token nvarchar(255) NOT NULL, + bp_restrictions nvarchar(max) NOT NULL, + bp_grants nvarchar(max) NOT NULL, + PRIMARY KEY (bp_user, bp_app_id) +); + + +-- +-- Edits, blocks, and other actions typically have a textual comment describing +-- the action. They are stored here to reduce the size of the main tables, and +-- to allow for deduplication. +-- +-- Deduplication is currently best-effort to avoid locking on inserts that +-- would be required for strict deduplication. There MAY be multiple rows with +-- the same comment_text and comment_data. +-- +CREATE TABLE /*_*/comment ( + comment_id bigint unsigned NOT NULL PRIMARY KEY IDENTITY(0,1), + comment_hash INT NOT NULL, + comment_text nvarchar(max) NOT NULL, + comment_data nvarchar(max) +); +-- Index used for deduplication. +CREATE INDEX /*i*/comment_hash ON /*_*/comment (comment_hash); + +-- dummy row for FKs. Hash is intentionally wrong so CommentStore won't match it. +INSERT INTO /*_*/comment (comment_hash, comment_text) VALUES (-1, '** dummy **'); + + +-- +-- Core of the wiki: each page has an entry here which identifies +-- it by title and contains some essential metadata. +-- +CREATE TABLE /*_*/page ( + page_id INT NOT NULL PRIMARY KEY IDENTITY(0,1), + page_namespace INT NOT NULL, + page_title NVARCHAR(255) NOT NULL, + page_restrictions NVARCHAR(255) NOT NULL, + page_is_redirect BIT NOT NULL DEFAULT 0, + page_is_new BIT NOT NULL DEFAULT 0, + page_random real NOT NULL DEFAULT RAND(), + page_touched varchar(14) NOT NULL default '', + page_links_updated varchar(14) DEFAULT NULL, + page_latest INT, -- FK inserted later + page_len INT NOT NULL, + page_content_model nvarchar(32) default null, + page_lang VARBINARY(35) DEFAULT NULL +); +CREATE UNIQUE INDEX /*i*/name_title ON /*_*/page (page_namespace,page_title); +CREATE INDEX /*i*/page_random ON /*_*/page (page_random); +CREATE INDEX /*i*/page_len ON /*_*/page (page_len); +CREATE INDEX /*i*/page_redirect_namespace_len ON /*_*/page (page_is_redirect, page_namespace, page_len); + +-- insert a dummy page +INSERT INTO /*_*/page (page_namespace, page_title, page_restrictions, page_latest, page_len) VALUES (-1,'','',0,0); + +-- +-- Every edit of a page creates also a revision row. +-- This stores metadata about the revision, and a reference +-- to the TEXT storage backend. +-- +CREATE TABLE /*_*/revision ( + rev_id INT NOT NULL UNIQUE IDENTITY(0,1), + rev_page INT NOT NULL REFERENCES /*_*/page(page_id) ON DELETE CASCADE, + rev_text_id INT NOT NULL CONSTRAINT DF_rev_text_id DEFAULT 0, -- FK added later + rev_comment NVARCHAR(255) NOT NULL CONSTRAINT DF_rev_comment DEFAULT '', + rev_user INT REFERENCES /*_*/mwuser(user_id) ON DELETE SET NULL, + rev_user_text NVARCHAR(255) NOT NULL DEFAULT '', + rev_timestamp varchar(14) NOT NULL default '', + rev_minor_edit BIT NOT NULL DEFAULT 0, + rev_deleted TINYINT NOT NULL DEFAULT 0, + rev_len INT, + rev_parent_id INT DEFAULT NULL REFERENCES /*_*/revision(rev_id), + rev_sha1 nvarchar(32) not null default '', + rev_content_model nvarchar(32) default null, + rev_content_format nvarchar(64) default null +); +CREATE UNIQUE CLUSTERED INDEX /*i*/rev_page_id ON /*_*/revision (rev_page, rev_id); +CREATE INDEX /*i*/rev_timestamp ON /*_*/revision (rev_timestamp); +CREATE INDEX /*i*/page_timestamp ON /*_*/revision (rev_page,rev_timestamp); +CREATE INDEX /*i*/user_timestamp ON /*_*/revision (rev_user,rev_timestamp); +CREATE INDEX /*i*/usertext_timestamp ON /*_*/revision (rev_user_text,rev_timestamp); +CREATE INDEX /*i*/page_user_timestamp ON /*_*/revision (rev_page,rev_user,rev_timestamp); + +-- insert a dummy revision +INSERT INTO /*_*/revision (rev_page,rev_text_id,rev_comment,rev_user,rev_len) VALUES (0,0,'',0,0); + +ALTER TABLE /*_*/page ADD CONSTRAINT FK_page_latest_page_id FOREIGN KEY (page_latest) REFERENCES /*_*/revision(rev_id); + +-- +-- Temporary tables to avoid blocking on an alter of revision. +-- +-- On large wikis like the English Wikipedia, altering the revision table is a +-- months-long process. This table is being created to avoid such an alter, and +-- will be merged back into revision in the future. +-- +CREATE TABLE /*_*/revision_comment_temp ( + revcomment_rev INT NOT NULL CONSTRAINT FK_revcomment_rev FOREIGN KEY REFERENCES /*_*/revision(rev_id) ON DELETE CASCADE, + revcomment_comment_id bigint unsigned NOT NULL CONSTRAINT FK_revcomment_comment_id FOREIGN KEY REFERENCES /*_*/comment(comment_id), + CONSTRAINT PK_revision_comment_temp PRIMARY KEY (revcomment_rev, revcomment_comment_id) +); +CREATE UNIQUE INDEX /*i*/revcomment_rev ON /*_*/revision_comment_temp (revcomment_rev); + +CREATE TABLE /*_*/revision_actor_temp ( + revactor_rev int unsigned NOT NULL CONSTRAINT FK_revactor_rev FOREIGN KEY REFERENCES /*_*/revision(rev_id) ON DELETE CASCADE, + revactor_actor bigint unsigned NOT NULL, + revactor_timestamp varchar(14) NOT NULL CONSTRAINT DF_revactor_timestamp DEFAULT '', + revactor_page int unsigned NOT NULL, + CONSTRAINT PK_revision_actor_temp PRIMARY KEY (revactor_rev, revactor_actor) +); +CREATE UNIQUE INDEX /*i*/revactor_rev ON /*_*/revision_actor_temp (revactor_rev); +CREATE INDEX /*i*/actor_timestamp ON /*_*/revision_actor_temp (revactor_actor,revactor_timestamp); +CREATE INDEX /*i*/page_actor_timestamp ON /*_*/revision_actor_temp (revactor_page,revactor_actor,revactor_timestamp); + +-- +-- Holds TEXT of individual page revisions. +-- +-- Field names are a holdover from the 'old' revisions table in +-- MediaWiki 1.4 and earlier: an upgrade will transform that +-- table INTo the 'text' table to minimize unnecessary churning +-- and downtime. If upgrading, the other fields will be left unused. +CREATE TABLE /*_*/text ( + old_id INT NOT NULL PRIMARY KEY IDENTITY(0,1), + old_text nvarchar(max) NOT NULL, + old_flags NVARCHAR(255) NOT NULL, +); + +-- insert a dummy text +INSERT INTO /*_*/text (old_text,old_flags) VALUES ('',''); + +ALTER TABLE /*_*/revision ADD CONSTRAINT FK_rev_text_id_old_id FOREIGN KEY (rev_text_id) REFERENCES /*_*/text(old_id) ON DELETE CASCADE; + +-- +-- Holding area for deleted articles, which may be viewed +-- or restored by admins through the Special:Undelete interface. +-- The fields generally correspond to the page, revision, and text +-- fields, with several caveats. +-- Cannot reasonably create views on this table, due to the presence of TEXT +-- columns. +CREATE TABLE /*_*/archive ( + ar_id int NOT NULL PRIMARY KEY IDENTITY, + ar_namespace SMALLINT NOT NULL DEFAULT 0, + ar_title NVARCHAR(255) NOT NULL DEFAULT '', + ar_comment NVARCHAR(255) NOT NULL CONSTRAINT DF_ar_comment DEFAULT '', + ar_comment_id bigint unsigned NOT NULL CONSTRAINT DF_ar_comment_id DEFAULT 0 CONSTRAINT FK_ar_comment_id FOREIGN KEY REFERENCES /*_*/comment(comment_id), + ar_user INT CONSTRAINT ar_user__user_id__fk FOREIGN KEY REFERENCES /*_*/mwuser(user_id), + ar_user_text NVARCHAR(255) NOT NULL CONSTRAINT DF_ar_user_text DEFAULT '', + ar_actor bigint unsigned NOT NULL CONSTRAINT DF_ar_actor DEFAULT 0, + ar_timestamp varchar(14) NOT NULL default '', + ar_minor_edit BIT NOT NULL DEFAULT 0, + ar_rev_id INT NOT NULL, -- NOT a FK, the row gets deleted from revision and moved here + ar_text_id INT NOT NULL CONSTRAINT DF_ar_text_id DEFAULT 0 CONSTRAINT ar_text_id__old_id__fk FOREIGN KEY REFERENCES /*_*/text(old_id) ON DELETE CASCADE, + ar_deleted TINYINT NOT NULL DEFAULT 0, + ar_len INT, + ar_page_id INT NULL, -- NOT a FK, the row gets deleted from page and moved here + ar_parent_id INT NULL, -- NOT FK + ar_sha1 nvarchar(32) default null, + ar_content_model nvarchar(32) DEFAULT NULL, + ar_content_format nvarchar(64) DEFAULT NULL +); +CREATE INDEX /*i*/name_title_timestamp ON /*_*/archive (ar_namespace,ar_title,ar_timestamp); +CREATE INDEX /*i*/ar_usertext_timestamp ON /*_*/archive (ar_user_text,ar_timestamp); +CREATE INDEX /*i*/ar_actor_timestamp ON /*_*/archive (ar_actor,ar_timestamp); +CREATE INDEX /*i*/ar_revid ON /*_*/archive (ar_rev_id); + + +-- +-- Slots represent an n:m relation between revisions and content objects. +-- A content object can have a specific "role" in one or more revisions. +-- Each revision can have multiple content objects, each having a different role. +-- +CREATE TABLE /*_*/slots ( + + -- reference to rev_id + slot_revision_id bigint unsigned NOT NULL, + + -- reference to role_id + slot_role_id smallint unsigned NOT NULL CONSTRAINT FK_slots_slot_role FOREIGN KEY REFERENCES slot_roles(role_id), + + -- reference to content_id + slot_content_id bigint unsigned NOT NULL CONSTRAINT FK_slots_content_id FOREIGN KEY REFERENCES content(content_id), + + -- The revision ID of the revision that originated the slot's content. + -- To find revisions that changed slots, look for slot_origin = slot_revision_id. + slot_origin bigint NOT NULL, + + CONSTRAINT PK_slots PRIMARY KEY (slot_revision_id, slot_role_id) +); + +-- Index for finding revisions that modified a specific slot +CREATE INDEX /*i*/slot_revision_origin_role ON /*_*/slots (slot_revision_id, slot_origin, slot_role_id); + +-- +-- The content table represents content objects. It's primary purpose is to provide the necessary +-- meta-data for loading and interpreting a serialized data blob to create a content object. +-- +CREATE TABLE /*_*/content ( + + -- ID of the content object + content_id bigint unsigned NOT NULL CONSTRAINT PK_content PRIMARY KEY IDENTITY, + + -- Nominal size of the content object (not necessarily of the serialized blob) + content_size int unsigned NOT NULL, + + -- Nominal hash of the content object (not necessarily of the serialized blob) + content_sha1 varchar(32) NOT NULL, + + -- reference to model_id + content_model smallint unsigned NOT NULL CONSTRAINT FK_content_content_models FOREIGN KEY REFERENCES /*_*/content_models(model_id), + + -- URL-like address of the content blob + content_address nvarchar(255) NOT NULL +); + +-- +-- Normalization table for role names +-- +CREATE TABLE /*_*/slot_roles ( + role_id smallint NOT NULL CONSTRAINT PK_slot_roles PRIMARY KEY IDENTITY, + role_name nvarchar(64) NOT NULL +); + +-- Index for looking of the internal ID of for a name +CREATE UNIQUE INDEX /*i*/role_name ON /*_*/slot_roles (role_name); + +-- +-- Normalization table for content model names +-- +CREATE TABLE /*_*/content_models ( + model_id smallint NOT NULL CONSTRAINT PK_content_models PRIMARY KEY IDENTITY, + model_name nvarchar(64) NOT NULL +); + +-- Index for looking of the internal ID of for a name +CREATE UNIQUE INDEX /*i*/model_name ON /*_*/content_models (model_name); + + +-- +-- Track page-to-page hyperlinks within the wiki. +-- +CREATE TABLE /*_*/pagelinks ( + pl_from INT NOT NULL REFERENCES /*_*/page(page_id) ON DELETE CASCADE, + pl_from_namespace int NOT NULL DEFAULT 0, + pl_namespace INT NOT NULL DEFAULT 0, + pl_title NVARCHAR(255) NOT NULL DEFAULT '', +); +CREATE UNIQUE INDEX /*i*/pl_from ON /*_*/pagelinks (pl_from,pl_namespace,pl_title); +CREATE UNIQUE INDEX /*i*/pl_namespace ON /*_*/pagelinks (pl_namespace,pl_title,pl_from); +CREATE INDEX /*i*/pl_backlinks_namespace ON /*_*/pagelinks (pl_from_namespace,pl_namespace,pl_title,pl_from); + + +-- +-- Track template inclusions. +-- +CREATE TABLE /*_*/templatelinks ( + tl_from int NOT NULL REFERENCES /*_*/page(page_id) ON DELETE CASCADE, + tl_from_namespace int NOT NULL default 0, + tl_namespace int NOT NULL default 0, + tl_title nvarchar(255) NOT NULL default '' +); + +CREATE UNIQUE INDEX /*i*/tl_from ON /*_*/templatelinks (tl_from,tl_namespace,tl_title); +CREATE UNIQUE INDEX /*i*/tl_namespace ON /*_*/templatelinks (tl_namespace,tl_title,tl_from); +CREATE INDEX /*i*/tl_backlinks_namespace ON /*_*/templatelinks (tl_from_namespace,tl_namespace,tl_title,tl_from); + + +-- +-- Track links to images *used inline* +-- We don't distinguish live from broken links here, so +-- they do not need to be changed on upload/removal. +-- +CREATE TABLE /*_*/imagelinks ( + -- Key to page_id of the page containing the image / media link. + il_from int NOT NULL REFERENCES /*_*/page(page_id) ON DELETE CASCADE, + il_from_namespace int NOT NULL default 0, + + -- Filename of target image. + -- This is also the page_title of the file's description page; + -- all such pages are in namespace 6 (NS_FILE). + il_to nvarchar(255) NOT NULL default '' +); + +CREATE UNIQUE INDEX /*i*/il_from ON /*_*/imagelinks (il_from,il_to); +CREATE UNIQUE INDEX /*i*/il_to ON /*_*/imagelinks (il_to,il_from); +CREATE INDEX /*i*/il_backlinks_namespace ON /*_*/imagelinks (il_from_namespace,il_to,il_from); + +-- +-- Track category inclusions *used inline* +-- This tracks a single level of category membership +-- +CREATE TABLE /*_*/categorylinks ( + -- Key to page_id of the page defined as a category member. + cl_from int NOT NULL REFERENCES /*_*/page(page_id) ON DELETE CASCADE, + + -- Name of the category. + -- This is also the page_title of the category's description page; + -- all such pages are in namespace 14 (NS_CATEGORY). + cl_to nvarchar(255) NOT NULL default '', + + -- A binary string obtained by applying a sortkey generation algorithm + -- (Collation::getSortKey()) to page_title, or cl_sortkey_prefix . "\n" + -- . page_title if cl_sortkey_prefix is nonempty. + cl_sortkey varbinary(230) NOT NULL default 0x, + + -- A prefix for the raw sortkey manually specified by the user, either via + -- [[Category:Foo|prefix]] or {{defaultsort:prefix}}. If nonempty, it's + -- concatenated with a line break followed by the page title before the sortkey + -- conversion algorithm is run. We store this so that we can update + -- collations without reparsing all pages. + -- Note: If you change the length of this field, you also need to change + -- code in LinksUpdate.php. See T27254. + cl_sortkey_prefix varbinary(255) NOT NULL default 0x, + + -- This isn't really used at present. Provided for an optional + -- sorting method by approximate addition time. + cl_timestamp varchar(14) NOT NULL, + + -- Stores $wgCategoryCollation at the time cl_sortkey was generated. This + -- can be used to install new collation versions, tracking which rows are not + -- yet updated. '' means no collation, this is a legacy row that needs to be + -- updated by updateCollation.php. In the future, it might be possible to + -- specify different collations per category. + cl_collation nvarchar(32) NOT NULL default '', + + -- Stores whether cl_from is a category, file, or other page, so we can + -- paginate the three categories separately. This never has to be updated + -- after the page is created, since none of these page types can be moved to + -- any other. + cl_type varchar(10) NOT NULL default 'page', + -- SQL server doesn't have enums, so we approximate with this + CONSTRAINT cl_type_ckc CHECK (cl_type IN('page', 'subcat', 'file')) +); + +CREATE UNIQUE INDEX /*i*/cl_from ON /*_*/categorylinks (cl_from,cl_to); + +-- We always sort within a given category, and within a given type. FIXME: +-- Formerly this index didn't cover cl_type (since that didn't exist), so old +-- callers won't be using an index: fix this? +CREATE INDEX /*i*/cl_sortkey ON /*_*/categorylinks (cl_to,cl_type,cl_sortkey,cl_from); + +-- Used by the API (and some extensions) +CREATE INDEX /*i*/cl_timestamp ON /*_*/categorylinks (cl_to,cl_timestamp); + +-- Used when updating collation (e.g. updateCollation.php) +CREATE INDEX /*i*/cl_collation_ext ON /*_*/categorylinks (cl_collation, cl_to, cl_type, cl_from); + +-- +-- Track all existing categories. Something is a category if 1) it has an entry +-- somewhere in categorylinks, or 2) it has a description page. Categories +-- might not have corresponding pages, so they need to be tracked separately. +-- +CREATE TABLE /*_*/category ( + -- Primary key + cat_id int NOT NULL PRIMARY KEY IDENTITY, + + -- Name of the category, in the same form as page_title (with underscores). + -- If there is a category page corresponding to this category, by definition, + -- it has this name (in the Category namespace). + cat_title nvarchar(255) NOT NULL, + + -- The numbers of member pages (including categories and media), subcatego- + -- ries, and Image: namespace members, respectively. These are signed to + -- make underflow more obvious. We make the first number include the second + -- two for better sorting: subtracting for display is easy, adding for order- + -- ing is not. + cat_pages int NOT NULL default 0, + cat_subcats int NOT NULL default 0, + cat_files int NOT NULL default 0 +); + +CREATE UNIQUE INDEX /*i*/cat_title ON /*_*/category (cat_title); + +-- For Special:Mostlinkedcategories +CREATE INDEX /*i*/cat_pages ON /*_*/category (cat_pages); + + +-- +-- Track links to external URLs +-- +CREATE TABLE /*_*/externallinks ( + -- Primary key + el_id int NOT NULL PRIMARY KEY IDENTITY, + + -- page_id of the referring page + el_from int NOT NULL REFERENCES /*_*/page(page_id) ON DELETE CASCADE, + + -- The URL + el_to nvarchar(max) NOT NULL, + + -- In the case of HTTP URLs, this is the URL with any username or password + -- removed, and with the labels in the hostname reversed and converted to + -- lower case. An extra dot is added to allow for matching of either + -- example.com or *.example.com in a single scan. + -- Example: + -- http://user:password@sub.example.com/page.html + -- becomes + -- http://com.example.sub./page.html + -- which allows for fast searching for all pages under example.com with the + -- clause: + -- WHERE el_index LIKE 'http://com.example.%' + el_index nvarchar(450) NOT NULL, + + -- This is el_index truncated to 60 bytes to allow for sortable queries that + -- aren't supported by a partial index. + -- @todo Drop the default once this is deployed everywhere and code is populating it. + el_index_60 varbinary(60) NOT NULL default '' +); + +CREATE INDEX /*i*/el_from ON /*_*/externallinks (el_from); +CREATE INDEX /*i*/el_index ON /*_*/externallinks (el_index); +CREATE INDEX /*i*/el_index_60 ON /*_*/externallinks (el_index_60, el_id); +CREATE INDEX /*i*/el_from_index_60 ON /*_*/externallinks (el_from, el_index_60, el_id); +-- el_to index intentionally not added; we cannot index nvarchar(max) columns, +-- but we also cannot restrict el_to to a smaller column size as the external +-- link may be larger. + +-- +-- Track interlanguage links +-- +CREATE TABLE /*_*/langlinks ( + -- page_id of the referring page + ll_from int NOT NULL REFERENCES /*_*/page(page_id) ON DELETE CASCADE, + + -- Language code of the target + ll_lang nvarchar(20) NOT NULL default '', + + -- Title of the target, including namespace + ll_title nvarchar(255) NOT NULL default '' +); + +CREATE UNIQUE INDEX /*i*/ll_from ON /*_*/langlinks (ll_from, ll_lang); +CREATE INDEX /*i*/ll_lang ON /*_*/langlinks (ll_lang, ll_title); + + +-- +-- Track inline interwiki links +-- +CREATE TABLE /*_*/iwlinks ( + -- page_id of the referring page + iwl_from int NOT NULL REFERENCES /*_*/page(page_id) ON DELETE CASCADE, + + -- Interwiki prefix code of the target + iwl_prefix nvarchar(20) NOT NULL default '', + + -- Title of the target, including namespace + iwl_title nvarchar(255) NOT NULL default '' +); + +CREATE UNIQUE INDEX /*i*/iwl_from ON /*_*/iwlinks (iwl_from, iwl_prefix, iwl_title); +CREATE INDEX /*i*/iwl_prefix_title_from ON /*_*/iwlinks (iwl_prefix, iwl_title, iwl_from); +CREATE INDEX /*i*/iwl_prefix_from_title ON /*_*/iwlinks (iwl_prefix, iwl_from, iwl_title); + + +-- +-- Contains a single row with some aggregate info +-- on the state of the site. +-- +CREATE TABLE /*_*/site_stats ( + -- The single row should contain 1 here. + ss_row_id int NOT NULL CONSTRAINT /*i*/ss_row_id PRIMARY KEY, + + -- Total number of edits performed. + ss_total_edits bigint default NULL, + + -- See SiteStatsInit::articles(). + ss_good_articles bigint default NULL, + + -- Total pages, theoretically equal to SELECT COUNT(*) FROM page. + ss_total_pages bigint default NULL, + + -- Number of users, theoretically equal to SELECT COUNT(*) FROM user. + ss_users bigint default NULL, + + -- Number of users that still edit. + ss_active_users bigint default NULL, + + -- Number of images, equivalent to SELECT COUNT(*) FROM image. + ss_images bigint default NULL +); + + +-- +-- The internet is full of jerks, alas. Sometimes it's handy +-- to block a vandal or troll account. +-- +CREATE TABLE /*_*/ipblocks ( + -- Primary key, introduced for privacy. + ipb_id int NOT NULL PRIMARY KEY IDENTITY, + + -- Blocked IP address in dotted-quad form or user name. + ipb_address nvarchar(255) NOT NULL, + + -- Blocked user ID or 0 for IP blocks. + ipb_user int REFERENCES /*_*/mwuser(user_id), + + -- User ID who made the block. + ipb_by int REFERENCES /*_*/mwuser(user_id) ON DELETE CASCADE, + + -- Actor ID who made the block. + ipb_by_actor bigint unsigned NOT NULL CONSTRAINT DF_ipb_by_actor DEFAULT 0, + + -- User name of blocker + ipb_by_text nvarchar(255) NOT NULL default '', + + -- Text comment made by blocker. + ipb_reason nvarchar(255) NOT NULL CONSTRAINT DF_ipb_reason DEFAULT '', + + -- Key to comment_id. Text comment made by blocker. + -- ("DEFAULT 0" is temporary, signaling that ipb_reason should be used) + ipb_reason_id bigint unsigned NOT NULL CONSTRAINT DF_ipb_reason_id DEFAULT 0 CONSTRAINT FK_ipb_reason_id FOREIGN KEY REFERENCES /*_*/comment(comment_id), + + -- Creation (or refresh) date in standard YMDHMS form. + -- IP blocks expire automatically. + ipb_timestamp varchar(14) NOT NULL default '', + + -- Indicates that the IP address was banned because a banned + -- user accessed a page through it. If this is 1, ipb_address + -- will be hidden, and the block identified by block ID number. + ipb_auto bit NOT NULL default 0, + + -- If set to 1, block applies only to logged-out users + ipb_anon_only bit NOT NULL default 0, + + -- Block prevents account creation from matching IP addresses + ipb_create_account bit NOT NULL default 1, + + -- Block triggers autoblocks + ipb_enable_autoblock bit NOT NULL default 1, + + -- Time at which the block will expire. + -- May be "infinity" + ipb_expiry varchar(14) NOT NULL, + + -- Start and end of an address range, in hexadecimal + -- Size chosen to allow IPv6 + -- FIXME: these fields were originally blank for single-IP blocks, + -- but now they are populated. No migration was ever done. They + -- should be fixed to be blank again for such blocks (T51504). + ipb_range_start varchar(255) NOT NULL, + ipb_range_end varchar(255) NOT NULL, + + -- Flag for entries hidden from users and Sysops + ipb_deleted bit NOT NULL default 0, + + -- Block prevents user from accessing Special:Emailuser + ipb_block_email bit NOT NULL default 0, + + -- Block allows user to edit their own talk page + ipb_allow_usertalk bit NOT NULL default 0, + + -- ID of the block that caused this block to exist + -- Autoblocks set this to the original block + -- so that the original block being deleted also + -- deletes the autoblocks + ipb_parent_block_id int default NULL REFERENCES /*_*/ipblocks(ipb_id) + +); + +-- Unique index to support "user already blocked" messages +-- Any new options which prevent collisions should be included +CREATE UNIQUE INDEX /*i*/ipb_address ON /*_*/ipblocks (ipb_address, ipb_user, ipb_auto, ipb_anon_only); + +CREATE INDEX /*i*/ipb_user ON /*_*/ipblocks (ipb_user); +CREATE INDEX /*i*/ipb_range ON /*_*/ipblocks (ipb_range_start, ipb_range_end); +CREATE INDEX /*i*/ipb_timestamp ON /*_*/ipblocks (ipb_timestamp); +CREATE INDEX /*i*/ipb_expiry ON /*_*/ipblocks (ipb_expiry); +CREATE INDEX /*i*/ipb_parent_block_id ON /*_*/ipblocks (ipb_parent_block_id); + + +-- +-- Uploaded images and other files. +-- +CREATE TABLE /*_*/image ( + -- Filename. + -- This is also the title of the associated description page, + -- which will be in namespace 6 (NS_FILE). + img_name nvarchar(255) NOT NULL default '' PRIMARY KEY, + + -- File size in bytes. + img_size int NOT NULL default 0, + + -- For images, size in pixels. + img_width int NOT NULL default 0, + img_height int NOT NULL default 0, + + -- Extracted Exif metadata stored as a serialized PHP array. + img_metadata varbinary(max) NOT NULL, + + -- For images, bits per pixel if known. + img_bits int NOT NULL default 0, + + -- Media type as defined by the MEDIATYPE_xxx constants + img_media_type varchar(16) default null, + + -- major part of a MIME media type as defined by IANA + -- see https://www.iana.org/assignments/media-types/ + img_major_mime varchar(16) not null default 'unknown', + + -- minor part of a MIME media type as defined by IANA + -- the minor parts are not required to adher to any standard + -- but should be consistent throughout the database + -- see https://www.iana.org/assignments/media-types/ + img_minor_mime nvarchar(100) NOT NULL default 'unknown', + + -- Description field as entered by the uploader. + -- This is displayed in image upload history and logs. + img_description nvarchar(255) NOT NULL CONSTRAINT DF_img_description DEFAULT '', + img_description_id bigint NOT NULL CONSTRAINT DF_img_description_id DEFAULT 0 CONSTRAINT FK_img_description_id FOREIGN KEY REFERENCES /*_*/comment(comment_id), + + -- user_id and user_name of uploader. + img_user int REFERENCES /*_*/mwuser(user_id) ON DELETE SET NULL, + img_user_text nvarchar(255) NOT NULL CONSTRAINT DF_img_user_text DEFAULT '', + img_actor bigint unsigned NOT NULL CONSTRAINT DF_img_actor DEFAULT 0, + + -- Time of the upload. + img_timestamp nvarchar(14) NOT NULL default '', + + -- SHA-1 content hash in base-36 + img_sha1 nvarchar(32) NOT NULL default '', + + CONSTRAINT img_major_mime_ckc check (img_major_mime IN('unknown', 'application', 'audio', 'image', 'text', 'video', 'message', 'model', 'multipart', 'chemical')), + CONSTRAINT img_media_type_ckc check (img_media_type in('UNKNOWN', 'BITMAP', 'DRAWING', 'AUDIO', 'VIDEO', 'MULTIMEDIA', 'OFFICE', 'TEXT', 'EXECUTABLE', 'ARCHIVE','3D')) +); + +CREATE INDEX /*i*/img_usertext_timestamp ON /*_*/image (img_user_text,img_timestamp); +CREATE INDEX /*i*/img_actor_timestamp ON /*_*/image (img_actor, img_timestamp); +-- Used by Special:ListFiles for sort-by-size +CREATE INDEX /*i*/img_size ON /*_*/image (img_size); +-- Used by Special:Newimages and Special:ListFiles +CREATE INDEX /*i*/img_timestamp ON /*_*/image (img_timestamp); +-- Used in API and duplicate search +CREATE INDEX /*i*/img_sha1 ON /*_*/image (img_sha1); +-- Used to get media of one type +CREATE INDEX /*i*/img_media_mime ON /*_*/image (img_media_type,img_major_mime,img_minor_mime); + +-- +-- Temporary table to avoid blocking on an alter of image. +-- +-- On large wikis like Wikimedia Commons, altering the image table is a +-- months-long process. This table is being created to avoid such an alter, and +-- will be merged back into image in the future. +-- +CREATE TABLE /*_*/image_comment_temp ( + imgcomment_name nvarchar(255) NOT NULL CONSTRAINT FK_imgcomment_name FOREIGN KEY REFERENCES /*_*/image(imgcomment_name) ON DELETE CASCADE, + imgcomment_description_id bigint unsigned NOT NULL CONSTRAINT FK_imgcomment_description_id FOREIGN KEY REFERENCES /*_*/comment(comment_id), + CONSTRAINT PK_image_comment_temp PRIMARY KEY (imgcomment_name, imgcomment_description_id) +); +CREATE UNIQUE INDEX /*i*/imgcomment_name ON /*_*/image_comment_temp (imgcomment_name); + + +-- +-- Previous revisions of uploaded files. +-- Awkwardly, image rows have to be moved into +-- this table at re-upload time. +-- +CREATE TABLE /*_*/oldimage ( + -- Base filename: key to image.img_name + -- Not a FK because deleting images removes them from image + oi_name nvarchar(255) NOT NULL default '', + + -- Filename of the archived file. + -- This is generally a timestamp and '!' prepended to the base name. + oi_archive_name nvarchar(255) NOT NULL default '', + + -- Other fields as in image... + oi_size int NOT NULL default 0, + oi_width int NOT NULL default 0, + oi_height int NOT NULL default 0, + oi_bits int NOT NULL default 0, + oi_description nvarchar(255) NOT NULL CONSTRAINT DF_oi_description DEFAULT '', + oi_description_id bigint unsigned NOT NULL CONSTRAINT DF_oi_description_id DEFAULT 0 CONSTRAINT FK_oi_description_id FOREIGN KEY REFERENCES /*_*/comment(comment_id), + oi_user int REFERENCES /*_*/mwuser(user_id), + oi_user_text nvarchar(255) NOT NULL CONSTRAINT DF_oi_user_text DEFAULT '', + oi_actor bigint unsigned NOT NULL CONSTRAINT DF_oi_actor DEFAULT 0, + oi_timestamp varchar(14) NOT NULL default '', + + oi_metadata varbinary(max) NOT NULL, + oi_media_type varchar(16) default null, + oi_major_mime varchar(16) not null default 'unknown', + oi_minor_mime nvarchar(100) NOT NULL default 'unknown', + oi_deleted tinyint NOT NULL default 0, + oi_sha1 nvarchar(32) NOT NULL default '', + + CONSTRAINT oi_major_mime_ckc check (oi_major_mime IN('unknown', 'application', 'audio', 'image', 'text', 'video', 'message', 'model', 'multipart', 'chemical')), + CONSTRAINT oi_media_type_ckc check (oi_media_type IN('UNKNOWN', 'BITMAP', 'DRAWING', 'AUDIO', 'VIDEO', 'MULTIMEDIA', 'OFFICE', 'TEXT', 'EXECUTABLE', 'ARCHIVE','3D')) +); + +CREATE INDEX /*i*/oi_usertext_timestamp ON /*_*/oldimage (oi_user_text,oi_timestamp); +CREATE INDEX /*i*/oi_actor_timestamp ON /*_*/oldimage (oi_actor,oi_timestamp); +CREATE INDEX /*i*/oi_name_timestamp ON /*_*/oldimage (oi_name,oi_timestamp); +CREATE INDEX /*i*/oi_sha1 ON /*_*/oldimage (oi_sha1); + + +-- +-- Record of deleted file data +-- +CREATE TABLE /*_*/filearchive ( + -- Unique row id + fa_id int NOT NULL PRIMARY KEY IDENTITY, + + -- Original base filename; key to image.img_name, page.page_title, etc + fa_name nvarchar(255) NOT NULL default '', + + -- Filename of archived file, if an old revision + fa_archive_name nvarchar(255) default '', + + -- Which storage bin (directory tree or object store) the file data + -- is stored in. Should be 'deleted' for files that have been deleted; + -- any other bin is not yet in use. + fa_storage_group nvarchar(16), + + -- SHA-1 of the file contents plus extension, used as a key for storage. + -- eg 8f8a562add37052a1848ff7771a2c515db94baa9.jpg + -- + -- If NULL, the file was missing at deletion time or has been purged + -- from the archival storage. + fa_storage_key nvarchar(64) default '', + + -- Deletion information, if this file is deleted. + fa_deleted_user int, + fa_deleted_timestamp varchar(14) default '', + fa_deleted_reason nvarchar(max) CONSTRAINT DF_fa_deleted_reason DEFAULT '', + fa_deleted_reason_id bigint unsigned NOT NULL CONSTRAINT DF_fa_deleted_reason_id DEFAULT 0 CONSTRAINT FK_fa_deleted_reason_id FOREIGN KEY REFERENCES /*_*/comment(comment_id), + + -- Duped fields from image + fa_size int default 0, + fa_width int default 0, + fa_height int default 0, + fa_metadata varbinary(max), + fa_bits int default 0, + fa_media_type varchar(16) default null, + fa_major_mime varchar(16) not null default 'unknown', + fa_minor_mime nvarchar(100) default 'unknown', + fa_description nvarchar(255) CONSTRAINT DF_fa_description DEFAULT '', + fa_description_id bigint unsigned NOT NULL CONSTRAINT DF_fa_description DEFAULT 0 CONSTRAINT FK_fa_description FOREIGN KEY REFERENCES /*_*/comment(comment_id), + fa_user int default 0 REFERENCES /*_*/mwuser(user_id) ON DELETE SET NULL, + fa_user_text nvarchar(255) CONSTRAINT DF_fa_user_text DEFAULT '', + fa_actor bigint unsigned NOT NULL CONSTRAINT DF_fa_actor DEFAULT 0, + fa_timestamp varchar(14) default '', + + -- Visibility of deleted revisions, bitfield + fa_deleted tinyint NOT NULL default 0, + + -- sha1 hash of file content + fa_sha1 nvarchar(32) NOT NULL default '', + + CONSTRAINT fa_major_mime_ckc check (fa_major_mime in('unknown', 'application', 'audio', 'image', 'text', 'video', 'message', 'model', 'multipart', 'chemical')), + CONSTRAINT fa_media_type_ckc check (fa_media_type in('UNKNOWN', 'BITMAP', 'DRAWING', 'AUDIO', 'VIDEO', 'MULTIMEDIA', 'OFFICE', 'TEXT', 'EXECUTABLE', 'ARCHIVE','3D')) +); + +-- pick out by image name +CREATE INDEX /*i*/fa_name ON /*_*/filearchive (fa_name, fa_timestamp); +-- pick out dupe files +CREATE INDEX /*i*/fa_storage_group ON /*_*/filearchive (fa_storage_group, fa_storage_key); +-- sort by deletion time +CREATE INDEX /*i*/fa_deleted_timestamp ON /*_*/filearchive (fa_deleted_timestamp); +-- sort by uploader +CREATE INDEX /*i*/fa_user_timestamp ON /*_*/filearchive (fa_user_text,fa_timestamp); +CREATE INDEX /*i*/fa_actor_timestamp ON /*_*/filearchive (fa_actor,fa_timestamp); +-- find file by sha1, 10 bytes will be enough for hashes to be indexed +CREATE INDEX /*i*/fa_sha1 ON /*_*/filearchive (fa_sha1); + + +-- +-- Store information about newly uploaded files before they're +-- moved into the actual filestore +-- +CREATE TABLE /*_*/uploadstash ( + us_id int NOT NULL PRIMARY KEY IDENTITY, + + -- the user who uploaded the file. + us_user int REFERENCES /*_*/mwuser(user_id) ON DELETE SET NULL, + + -- file key. this is how applications actually search for the file. + -- this might go away, or become the primary key. + us_key nvarchar(255) NOT NULL, + + -- the original path + us_orig_path nvarchar(255) NOT NULL, + + -- the temporary path at which the file is actually stored + us_path nvarchar(255) NOT NULL, + + -- which type of upload the file came from (sometimes) + us_source_type nvarchar(50), + + -- the date/time on which the file was added + us_timestamp varchar(14) NOT NULL, + + us_status nvarchar(50) NOT NULL, + + -- chunk counter starts at 0, current offset is stored in us_size + us_chunk_inx int NULL, + + -- Serialized file properties from FSFile::getProps() + us_props nvarchar(max), + + -- file size in bytes + us_size int NOT NULL, + -- this hash comes from FSFile::getSha1Base36(), and is 31 characters + us_sha1 nvarchar(31) NOT NULL, + us_mime nvarchar(255), + -- Media type as defined by the MEDIATYPE_xxx constants, should duplicate definition in the image table + us_media_type varchar(16) default null, + -- image-specific properties + us_image_width int, + us_image_height int, + us_image_bits smallint, + + CONSTRAINT us_media_type_ckc check (us_media_type in('UNKNOWN', 'BITMAP', 'DRAWING', 'AUDIO', 'VIDEO', 'MULTIMEDIA', 'OFFICE', 'TEXT', 'EXECUTABLE', 'ARCHIVE', '3D')) +); + +-- sometimes there's a delete for all of a user's stuff. +CREATE INDEX /*i*/us_user ON /*_*/uploadstash (us_user); +-- pick out files by key, enforce key uniqueness +CREATE UNIQUE INDEX /*i*/us_key ON /*_*/uploadstash (us_key); +-- the abandoned upload cleanup script needs this +CREATE INDEX /*i*/us_timestamp ON /*_*/uploadstash (us_timestamp); + + +-- +-- Primarily a summary table for Special:Recentchanges, +-- this table contains some additional info on edits from +-- the last few days, see Article::editUpdates() +-- +CREATE TABLE /*_*/recentchanges ( + rc_id int NOT NULL CONSTRAINT recentchanges__pk PRIMARY KEY IDENTITY, + rc_timestamp varchar(14) not null default '', + + -- As in revision + rc_user int NOT NULL default 0 CONSTRAINT rc_user__user_id__fk FOREIGN KEY REFERENCES /*_*/mwuser(user_id), + rc_user_text nvarchar(255) NOT NULL CONSTRAINT DF_rc_user_text DEFAULT '', + rc_actor bigint unsigned NOT NULL CONSTRAINT DF_rc_actor DEFAULT 0, + + -- When pages are renamed, their RC entries do _not_ change. + rc_namespace int NOT NULL default 0, + rc_title nvarchar(255) NOT NULL default '', + + -- as in revision... + rc_comment nvarchar(255) NOT NULL default '', + rc_comment_id bigint unsigned NOT NULL CONSTRAINT DF_rc_comment_id DEFAULT 0 CONSTRAINT FK_rc_comment_id FOREIGN KEY REFERENCES /*_*/comment(comment_id), + rc_minor bit NOT NULL default 0, + + -- Edits by user accounts with the 'bot' rights key are + -- marked with a 1 here, and will be hidden from the + -- default view. + rc_bot bit NOT NULL default 0, + + -- Set if this change corresponds to a page creation + rc_new bit NOT NULL default 0, + + -- Key to page_id (was cur_id prior to 1.5). + -- This will keep links working after moves while + -- retaining the at-the-time name in the changes list. + rc_cur_id int, -- NOT FK + + -- rev_id of the given revision + rc_this_oldid int, -- NOT FK + + -- rev_id of the prior revision, for generating diff links. + rc_last_oldid int, -- NOT FK + + -- The type of change entry (RC_EDIT,RC_NEW,RC_LOG,RC_EXTERNAL) + rc_type tinyint NOT NULL default 0, + + -- The source of the change entry (replaces rc_type) + -- default of '' is temporary, needed for initial migration + rc_source nvarchar(16) not null default '', + + -- If the Recent Changes Patrol option is enabled, + -- users may mark edits as having been reviewed to + -- remove a warning flag on the RC list. + -- A value of 1 indicates the page has been reviewed manually. + -- A value of 2 indicates the page has been automatically reviewed. + rc_patrolled tinyint NOT NULL CONSTRAINT DF_rc_patrolled DEFAULT 0, + + -- Recorded IP address the edit was made from, if the + -- $wgPutIPinRC option is enabled. + rc_ip nvarchar(40) NOT NULL default '', + + -- Text length in characters before + -- and after the edit + rc_old_len int, + rc_new_len int, + + -- Visibility of recent changes items, bitfield + rc_deleted tinyint NOT NULL default 0, + + -- Value corresponding to log_id, specific log entries + rc_logid int, -- FK added later + -- Store log type info here, or null + rc_log_type nvarchar(255) NULL default NULL, + -- Store log action or null + rc_log_action nvarchar(255) NULL default NULL, + -- Log params + rc_params nvarchar(max) NULL +); + +CREATE INDEX /*i*/rc_timestamp ON /*_*/recentchanges (rc_timestamp); +CREATE INDEX /*i*/rc_namespace_title_timestamp ON /*_*/recentchanges (rc_namespace, rc_title, rc_timestamp); +CREATE INDEX /*i*/rc_cur_id ON /*_*/recentchanges (rc_cur_id); +CREATE INDEX /*i*/new_name_timestamp ON /*_*/recentchanges (rc_new,rc_namespace,rc_timestamp); +CREATE INDEX /*i*/rc_ip ON /*_*/recentchanges (rc_ip); +CREATE INDEX /*i*/rc_ns_usertext ON /*_*/recentchanges (rc_namespace, rc_user_text); +CREATE INDEX /*i*/rc_user_text ON /*_*/recentchanges (rc_user_text, rc_timestamp); +CREATE INDEX /*i*/rc_ns_actor ON /*_*/recentchanges (rc_namespace, rc_actor); +CREATE INDEX /*i*/rc_actor ON /*_*/recentchanges (rc_actor, rc_timestamp); +CREATE INDEX /*i*/rc_name_type_patrolled_timestamp ON /*_*/recentchanges (rc_namespace, rc_type, rc_patrolled, rc_timestamp); + + +CREATE TABLE /*_*/watchlist ( + wl_id int NOT NULL PRIMARY KEY IDENTITY, + -- Key to user.user_id + wl_user int NOT NULL REFERENCES /*_*/mwuser(user_id) ON DELETE CASCADE, + + -- Key to page_namespace/page_title + -- Note that users may watch pages which do not exist yet, + -- or existed in the past but have been deleted. + wl_namespace int NOT NULL default 0, + wl_title nvarchar(255) NOT NULL default '', + + -- Timestamp used to send notification e-mails and show "updated since last visit" markers on + -- history and recent changes / watchlist. Set to NULL when the user visits the latest revision + -- of the page, which means that they should be sent an e-mail on the next change. + wl_notificationtimestamp varchar(14) + +); + +CREATE UNIQUE INDEX /*i*/wl_user ON /*_*/watchlist (wl_user, wl_namespace, wl_title); +CREATE INDEX /*i*/namespace_title ON /*_*/watchlist (wl_namespace, wl_title); + + +-- +-- Our search index for the builtin MediaWiki search +-- +CREATE TABLE /*_*/searchindex ( + -- Key to page_id + si_page int NOT NULL REFERENCES /*_*/page(page_id) ON DELETE CASCADE, + + -- Munged version of title + si_title nvarchar(255) NOT NULL default '', + + -- Munged version of body text + si_text nvarchar(max) NOT NULL +); + +CREATE UNIQUE INDEX /*i*/si_page ON /*_*/searchindex (si_page); +-- Fulltext index is defined in MssqlInstaller.php + +-- +-- Recognized interwiki link prefixes +-- +CREATE TABLE /*_*/interwiki ( + -- The interwiki prefix, (e.g. "Meatball", or the language prefix "de") + iw_prefix nvarchar(32) NOT NULL, + + -- The URL of the wiki, with "$1" as a placeholder for an article name. + -- Any spaces in the name will be transformed to underscores before + -- insertion. + iw_url nvarchar(max) NOT NULL, + + -- The URL of the file api.php + iw_api nvarchar(max) NOT NULL, + + -- The name of the database (for a connection to be established with wfGetLB( 'wikiid' )) + iw_wikiid nvarchar(64) NOT NULL, + + -- A boolean value indicating whether the wiki is in this project + -- (used, for example, to detect redirect loops) + iw_local bit NOT NULL, + + -- Boolean value indicating whether interwiki transclusions are allowed. + iw_trans bit NOT NULL default 0 +); + +CREATE UNIQUE INDEX /*i*/iw_prefix ON /*_*/interwiki (iw_prefix); + + +-- +-- Used for caching expensive grouped queries +-- +CREATE TABLE /*_*/querycache ( + -- A key name, generally the base name of of the special page. + qc_type nvarchar(32) NOT NULL, + + -- Some sort of stored value. Sizes, counts... + qc_value int NOT NULL default 0, + + -- Target namespace+title + qc_namespace int NOT NULL default 0, + qc_title nvarchar(255) NOT NULL default '' +); + +CREATE INDEX /*i*/qc_type ON /*_*/querycache (qc_type,qc_value); + + +-- +-- For a few generic cache operations if not using Memcached +-- +CREATE TABLE /*_*/objectcache ( + keyname nvarchar(255) NOT NULL default '' PRIMARY KEY, + value varbinary(max), + exptime varchar(14) +); +CREATE INDEX /*i*/exptime ON /*_*/objectcache (exptime); + + +-- +-- Cache of interwiki transclusion +-- +CREATE TABLE /*_*/transcache ( + tc_url nvarchar(255) NOT NULL, + tc_contents nvarchar(max), + tc_time varchar(14) NOT NULL +); + +CREATE UNIQUE INDEX /*i*/tc_url_idx ON /*_*/transcache (tc_url); + + +CREATE TABLE /*_*/logging ( + -- Log ID, for referring to this specific log entry, probably for deletion and such. + log_id int NOT NULL PRIMARY KEY IDENTITY(0,1), + + -- Symbolic keys for the general log type and the action type + -- within the log. The output format will be controlled by the + -- action field, but only the type controls categorization. + log_type nvarchar(32) NOT NULL default '', + log_action nvarchar(32) NOT NULL default '', + + -- Timestamp. Duh. + log_timestamp varchar(14) NOT NULL default '', + + -- The user who performed this action; key to user_id + log_user int, -- NOT an FK, if a user is deleted we still want to maintain a record of who did a thing + + -- Name of the user who performed this action + log_user_text nvarchar(255) NOT NULL default '', + + -- The actor who performed this action + log_actor bigint unsigned NOT NULL CONSTRAINT DF_log_actor DEFAULT 0, + + -- Key to the page affected. Where a user is the target, + -- this will point to the user page. + log_namespace int NOT NULL default 0, + log_title nvarchar(255) NOT NULL default '', + log_page int NULL, -- NOT an FK, logging entries are inserted for deleted pages which still reference the deleted page ids + + -- Freeform text. Interpreted as edit history comments. + log_comment nvarchar(255) NOT NULL default '', + + -- Key to comment_id. Comment summarizing the change. + -- ("DEFAULT 0" is temporary, signaling that log_comment should be used) + log_comment_id bigint unsigned NOT NULL CONSTRAINT DF_log_comment_id DEFAULT 0 CONSTRAINT FK_log_comment_id FOREIGN KEY REFERENCES /*_*/comment(comment_id), + + -- miscellaneous parameters: + -- LF separated list (old system) or serialized PHP array (new system) + log_params nvarchar(max) NOT NULL, + + -- rev_deleted for logs + log_deleted tinyint NOT NULL default 0 +); + +CREATE INDEX /*i*/type_time ON /*_*/logging (log_type, log_timestamp); +CREATE INDEX /*i*/user_time ON /*_*/logging (log_user, log_timestamp); +CREATE INDEX /*i*/page_time ON /*_*/logging (log_namespace, log_title, log_timestamp); +CREATE INDEX /*i*/times ON /*_*/logging (log_timestamp); +CREATE INDEX /*i*/log_user_type_time ON /*_*/logging (log_user, log_type, log_timestamp); +CREATE INDEX /*i*/log_page_id_time ON /*_*/logging (log_page,log_timestamp); +CREATE INDEX /*i*/type_action ON /*_*/logging (log_type, log_action, log_timestamp); +CREATE INDEX /*i*/log_user_text_type_time ON /*_*/logging (log_user_text, log_type, log_timestamp); +CREATE INDEX /*i*/log_user_text_time ON /*_*/logging (log_user_text, log_timestamp); +CREATE INDEX /*i*/actor_time ON /*_*/logging (log_actor, log_timestamp); +CREATE INDEX /*i*/log_actor_type_time ON /*_*/logging (log_actor, log_type, log_timestamp); + +INSERT INTO /*_*/logging (log_user,log_page,log_params) VALUES(0,0,''); + +ALTER TABLE /*_*/recentchanges ADD CONSTRAINT rc_logid__log_id__fk FOREIGN KEY (rc_logid) REFERENCES /*_*/logging(log_id) ON DELETE CASCADE; + +CREATE TABLE /*_*/log_search ( + -- The type of ID (rev ID, log ID, rev timestamp, username) + ls_field nvarchar(32) NOT NULL, + -- The value of the ID + ls_value nvarchar(255) NOT NULL, + -- Key to log_id + ls_log_id int REFERENCES /*_*/logging(log_id) ON DELETE CASCADE +); +CREATE UNIQUE INDEX /*i*/ls_field_val ON /*_*/log_search (ls_field,ls_value,ls_log_id); +CREATE INDEX /*i*/ls_log_id ON /*_*/log_search (ls_log_id); + + +-- Jobs performed by parallel apache threads or a command-line daemon +CREATE TABLE /*_*/job ( + job_id int NOT NULL PRIMARY KEY IDENTITY, + + -- Command name + -- Limited to 60 to prevent key length overflow + job_cmd nvarchar(60) NOT NULL default '', + + -- Namespace and title to act on + -- Should be 0 and '' if the command does not operate on a title + job_namespace int NOT NULL, + job_title nvarchar(255) NOT NULL, + + -- Timestamp of when the job was inserted + -- NULL for jobs added before addition of the timestamp + job_timestamp nvarchar(14) NULL default NULL, + + -- Any other parameters to the command + -- Stored as a PHP serialized array, or an empty string if there are no parameters + job_params nvarchar(max) NOT NULL, + + -- Random, non-unique, number used for job acquisition (for lock concurrency) + job_random int NOT NULL default 0, + + -- The number of times this job has been locked + job_attempts int NOT NULL default 0, + + -- Field that conveys process locks on rows via process UUIDs + job_token nvarchar(32) NOT NULL default '', + + -- Timestamp when the job was locked + job_token_timestamp varchar(14) NULL default NULL, + + -- Base 36 SHA1 of the job parameters relevant to detecting duplicates + job_sha1 nvarchar(32) NOT NULL default '' +); + +CREATE INDEX /*i*/job_sha1 ON /*_*/job (job_sha1); +CREATE INDEX /*i*/job_cmd_token ON /*_*/job (job_cmd,job_token,job_random); +CREATE INDEX /*i*/job_cmd_token_id ON /*_*/job (job_cmd,job_token,job_id); +CREATE INDEX /*i*/job_cmd ON /*_*/job (job_cmd, job_namespace, job_title); +CREATE INDEX /*i*/job_timestamp ON /*_*/job (job_timestamp); + + +-- Details of updates to cached special pages +CREATE TABLE /*_*/querycache_info ( + -- Special page name + -- Corresponds to a qc_type value + qci_type nvarchar(32) NOT NULL default '', + + -- Timestamp of last update + qci_timestamp varchar(14) NOT NULL default '' +); + +CREATE UNIQUE INDEX /*i*/qci_type ON /*_*/querycache_info (qci_type); + + +-- For each redirect, this table contains exactly one row defining its target +CREATE TABLE /*_*/redirect ( + -- Key to the page_id of the redirect page + rd_from int NOT NULL REFERENCES /*_*/page(page_id) ON DELETE CASCADE, + + -- Key to page_namespace/page_title of the target page. + -- The target page may or may not exist, and due to renames + -- and deletions may refer to different page records as time + -- goes by. + rd_namespace int NOT NULL default 0, + rd_title nvarchar(255) NOT NULL default '', + rd_interwiki nvarchar(32) default NULL, + rd_fragment nvarchar(255) default NULL +); + +CREATE INDEX /*i*/rd_ns_title ON /*_*/redirect (rd_namespace,rd_title,rd_from); + + +-- Used for caching expensive grouped queries that need two links (for example double-redirects) +CREATE TABLE /*_*/querycachetwo ( + -- A key name, generally the base name of of the special page. + qcc_type nvarchar(32) NOT NULL, + + -- Some sort of stored value. Sizes, counts... + qcc_value int NOT NULL default 0, + + -- Target namespace+title + qcc_namespace int NOT NULL default 0, + qcc_title nvarchar(255) NOT NULL default '', + + -- Target namespace+title2 + qcc_namespacetwo int NOT NULL default 0, + qcc_titletwo nvarchar(255) NOT NULL default '' +); + +CREATE INDEX /*i*/qcc_type ON /*_*/querycachetwo (qcc_type,qcc_value); +CREATE INDEX /*i*/qcc_title ON /*_*/querycachetwo (qcc_type,qcc_namespace,qcc_title); +CREATE INDEX /*i*/qcc_titletwo ON /*_*/querycachetwo (qcc_type,qcc_namespacetwo,qcc_titletwo); + + +-- Used for storing page restrictions (i.e. protection levels) +CREATE TABLE /*_*/page_restrictions ( + -- Field for an ID for this restrictions row (sort-key for Special:ProtectedPages) + pr_id int NOT NULL PRIMARY KEY IDENTITY, + -- Page to apply restrictions to (Foreign Key to page). + pr_page int NOT NULL REFERENCES /*_*/page(page_id) ON DELETE CASCADE, + -- The protection type (edit, move, etc) + pr_type nvarchar(60) NOT NULL, + -- The protection level (Sysop, autoconfirmed, etc) + pr_level nvarchar(60) NOT NULL, + -- Whether or not to cascade the protection down to pages transcluded. + pr_cascade bit NOT NULL, + -- Field for future support of per-user restriction. + pr_user int NULL, + -- Field for time-limited protection. + pr_expiry varchar(14) NULL +); + +CREATE UNIQUE INDEX /*i*/pr_pagetype ON /*_*/page_restrictions (pr_page,pr_type); +CREATE INDEX /*i*/pr_typelevel ON /*_*/page_restrictions (pr_type,pr_level); +CREATE INDEX /*i*/pr_level ON /*_*/page_restrictions (pr_level); +CREATE INDEX /*i*/pr_cascade ON /*_*/page_restrictions (pr_cascade); + + +-- Protected titles - nonexistent pages that have been protected +CREATE TABLE /*_*/protected_titles ( + pt_namespace int NOT NULL, + pt_title nvarchar(255) NOT NULL, + pt_user int REFERENCES /*_*/mwuser(user_id) ON DELETE SET NULL, + pt_reason nvarchar(255) CONSTRAINT DF_pt_reason DEFAULT '', + pt_reason_id bigint unsigned NOT NULL CONSTRAINT DF_pt_reason_id DEFAULT 0 CONSTRAINT FK_pt_reason_id FOREIGN KEY REFERENCES /*_*/comment(comment_id), + pt_timestamp varchar(14) NOT NULL, + pt_expiry varchar(14) NOT NULL, + pt_create_perm nvarchar(60) NOT NULL +); + +CREATE UNIQUE INDEX /*i*/pt_namespace_title ON /*_*/protected_titles (pt_namespace,pt_title); +CREATE INDEX /*i*/pt_timestamp ON /*_*/protected_titles (pt_timestamp); + + +-- Name/value pairs indexed by page_id +CREATE TABLE /*_*/page_props ( + pp_page int NOT NULL REFERENCES /*_*/page(page_id) ON DELETE CASCADE, + pp_propname nvarchar(60) NOT NULL, + pp_value nvarchar(max) NOT NULL, + pp_sortkey float DEFAULT NULL +); + +CREATE UNIQUE INDEX /*i*/pp_page_propname ON /*_*/page_props (pp_page,pp_propname); +CREATE UNIQUE INDEX /*i*/pp_propname_page ON /*_*/page_props (pp_propname,pp_page); +CREATE UNIQUE INDEX /*i*/pp_propname_sortkey_page ON /*_*/page_props (pp_propname,pp_sortkey,pp_page); + + +-- A table to log updates, one text key row per update. +CREATE TABLE /*_*/updatelog ( + ul_key nvarchar(255) NOT NULL PRIMARY KEY, + ul_value nvarchar(max) +); + + +-- A table to track tags for revisions, logs and recent changes. +CREATE TABLE /*_*/change_tag ( + ct_id int NOT NULL PRIMARY KEY IDENTITY, + -- RCID for the change + ct_rc_id int NULL REFERENCES /*_*/recentchanges(rc_id), + -- LOGID for the change + ct_log_id int NULL REFERENCES /*_*/logging(log_id), + -- REVID for the change + ct_rev_id int NULL REFERENCES /*_*/revision(rev_id), + -- Tag applied + ct_tag nvarchar(255) NOT NULL, + -- Parameters for the tag, presently unused + ct_params nvarchar(max) NULL +); + +CREATE UNIQUE INDEX /*i*/change_tag_rc_tag ON /*_*/change_tag (ct_rc_id,ct_tag); +CREATE UNIQUE INDEX /*i*/change_tag_log_tag ON /*_*/change_tag (ct_log_id,ct_tag); +CREATE UNIQUE INDEX /*i*/change_tag_rev_tag ON /*_*/change_tag (ct_rev_id,ct_tag); +-- Covering index, so we can pull all the info only out of the index. +CREATE INDEX /*i*/change_tag_tag_id ON /*_*/change_tag (ct_tag,ct_rc_id,ct_rev_id,ct_log_id); + + +-- Rollup table to pull a LIST of tags simply without ugly GROUP_CONCAT +-- that only works on MySQL 4.1+ +CREATE TABLE /*_*/tag_summary ( + ts_id int NOT NULL PRIMARY KEY IDENTITY, + -- RCID for the change + ts_rc_id int NULL REFERENCES /*_*/recentchanges(rc_id), + -- LOGID for the change + ts_log_id int NULL REFERENCES /*_*/logging(log_id), + -- REVID for the change + ts_rev_id int NULL REFERENCES /*_*/revision(rev_id), + -- Comma-separated list of tags + ts_tags nvarchar(max) NOT NULL +); + +CREATE UNIQUE INDEX /*i*/tag_summary_rc_id ON /*_*/tag_summary (ts_rc_id); +CREATE UNIQUE INDEX /*i*/tag_summary_log_id ON /*_*/tag_summary (ts_log_id); +CREATE UNIQUE INDEX /*i*/tag_summary_rev_id ON /*_*/tag_summary (ts_rev_id); + + +CREATE TABLE /*_*/valid_tag ( + vt_tag nvarchar(255) NOT NULL PRIMARY KEY +); + +-- Table for storing localisation data +CREATE TABLE /*_*/l10n_cache ( + -- Language code + lc_lang nvarchar(32) NOT NULL, + -- Cache key + lc_key nvarchar(255) NOT NULL, + -- Value + lc_value varbinary(max) NOT NULL +); +CREATE INDEX /*i*/lc_lang_key ON /*_*/l10n_cache (lc_lang, lc_key); + +-- Table caching which local files a module depends on that aren't +-- registered directly, used for fast retrieval of file dependency. +-- Currently only used for tracking images that CSS depends on +CREATE TABLE /*_*/module_deps ( + -- Module name + md_module nvarchar(255) NOT NULL, + -- Skin name + md_skin nvarchar(32) NOT NULL, + -- JSON nvarchar(max) with file dependencies + md_deps nvarchar(max) NOT NULL +); +CREATE UNIQUE INDEX /*i*/md_module_skin ON /*_*/module_deps (md_module, md_skin); + +-- Holds all the sites known to the wiki. +CREATE TABLE /*_*/sites ( + -- Numeric id of the site + site_id int NOT NULL PRIMARY KEY IDENTITY, + + -- Global identifier for the site, ie 'enwiktionary' + site_global_key nvarchar(32) NOT NULL, + + -- Type of the site, ie 'mediawiki' + site_type nvarchar(32) NOT NULL, + + -- Group of the site, ie 'wikipedia' + site_group nvarchar(32) NOT NULL, + + -- Source of the site data, ie 'local', 'wikidata', 'my-magical-repo' + site_source nvarchar(32) NOT NULL, + + -- Language code of the sites primary language. + site_language nvarchar(32) NOT NULL, + + -- Protocol of the site, ie 'http://', 'irc://', '//' + -- This field is an index for lookups and is build from type specific data in site_data. + site_protocol nvarchar(32) NOT NULL, + + -- Domain of the site in reverse order, ie 'org.mediawiki.www.' + -- This field is an index for lookups and is build from type specific data in site_data. + site_domain NVARCHAR(255) NOT NULL, + + -- Type dependent site data. + site_data nvarchar(max) NOT NULL, + + -- If site.tld/path/key:pageTitle should forward users to the page on + -- the actual site, where "key" is the local identifier. + site_forward bit NOT NULL, + + -- Type dependent site config. + -- For instance if template transclusion should be allowed if it's a MediaWiki. + site_config nvarchar(max) NOT NULL +); + +CREATE UNIQUE INDEX /*i*/sites_global_key ON /*_*/sites (site_global_key); +CREATE INDEX /*i*/sites_type ON /*_*/sites (site_type); +CREATE INDEX /*i*/sites_group ON /*_*/sites (site_group); +CREATE INDEX /*i*/sites_source ON /*_*/sites (site_source); +CREATE INDEX /*i*/sites_language ON /*_*/sites (site_language); +CREATE INDEX /*i*/sites_protocol ON /*_*/sites (site_protocol); +CREATE INDEX /*i*/sites_domain ON /*_*/sites (site_domain); +CREATE INDEX /*i*/sites_forward ON /*_*/sites (site_forward); + +-- Links local site identifiers to their corresponding site. +CREATE TABLE /*_*/site_identifiers ( + -- Key on site.site_id + si_site int NOT NULL REFERENCES /*_*/sites(site_id) ON DELETE CASCADE, + + -- local key type, ie 'interwiki' or 'langlink' + si_type nvarchar(32) NOT NULL, + + -- local key value, ie 'en' or 'wiktionary' + si_key nvarchar(32) NOT NULL +); + +CREATE UNIQUE INDEX /*i*/site_ids_type ON /*_*/site_identifiers (si_type, si_key); +CREATE INDEX /*i*/site_ids_site ON /*_*/site_identifiers (si_site); +CREATE INDEX /*i*/site_ids_key ON /*_*/site_identifiers (si_key); |