Módulo:Webarchive/data

Wikisource, a biblioteca livre
Documentação do módulo[ver] [editar] [histórico] [purgar]

Dados utilizados por Módulo:Webarchive.

--[[--------------------------< C O N F I G U R A T I O N >----------------------------------------------------

global configuration settings

]]

-- Global settings for the module.
local config = {
    -- upper bound on the number of URLs accepted
    ['maxurls'] = 10,
    -- name of the calling template; change this if the template is renamed
    ['tname'] = 'Webarchive',
    -- date verification switch (see the module documentation); false disables it
    ['verifydates'] = true,
}


--[[--------------------------< U N C A T E G O R I Z E D _ N A M E S P A C E S >------------------------------

List of namespaces that should not be included in citation error categories.

Note: Namespace names should use underscores instead of spaces.

]]

-- Set of namespace names (underscores instead of spaces) whose pages are left
-- out of the citation error categories.  Per the original note, this is the
-- same list as the one at [[Module:Citation/CS1/Configuration]].
-- NOTE(review): all names are the English ones; confirm they match the
-- namespace names this wiki actually reports.
local uncategorized_namespaces = {
    User = true,
    Talk = true,
    User_talk = true,
    Wikipedia_talk = true,
    File_talk = true,
    Template_talk = true,
    Help_talk = true,
    Category_talk = true,
    Portal_talk = true,
    Book_talk = true,
    Draft_talk = true,
    Education_Program_talk = true,
    Module_talk = true,
    MediaWiki_talk = true,
}

-- Lua patterns looked for in page names; pages that match should not be categorized.
local uncategorized_subpages = {
    '/[Tt]estes',
    '/[Ee]xemplos para testes',
}

-- Pages that are categorized when their entry is true; set an entry to nil to
-- disable it.
local excepted_pages = {
    -- test-case pages used during development
    ['Module talk:Webarchive/testcases'] = true,
    ['Template:Webarchive/testcases/Production'] = true,
}


--[[--------------------------< C A T E G O R I E S >----------------------------------------------------------

this is a table of all categories supported by Module:Webarchive

]]

-- Tracking categories supported by Module:Webarchive, keyed by the short names
-- that the services table refers to (categories.archiveis, categories.wayback,
-- categories.webcite).
local categories = {
    archiveis = 'Categoria:!Predefinição Webarchive archiveis links',
    error = 'Categoria:!Erros na predefinição Webarchive',
    other = 'Categoria:!Predefinição Webarchive outros arquivos',
    unknown = 'Categoria:!Predefinições Webarchive arquivos desconhecidos',
    warning = 'Categoria:!Avisos na predefinição Webarchive',
    -- Wayback Machine links need their own category.  This key used to repeat
    -- the archiveis category name, which filed every archive.org link under
    -- the archive.today tracking category.
    wayback = 'Categoria:!Predefinição Webarchive wayback links',
    webcite = 'Categoria:!Predefinição Webarchive webcite links',
}


--[[--------------------------< P R E F I X E S >--------------------------------------------------------------

used only with serviceName(), this table holds the two generic tail-text prefixes specified by services['<service name>'][1]

]]

-- The two generic tail-text prefixes; a service entry selects one of them
-- through its first field (false -> at, true -> atthe).
local prefixes = {
    ['at'] = 'na',
    ['atthe'] = 'no',
}


--[=[-------------------------< S E R V I C E S >--------------------------------------------------------------

this is a table of tables for archive services.  Each service table has:
    [1]=prefix; may be boolean true or false, or text string where:
        true indicates that the prefix is taken from prefixes.atthe
        false indicates that the prefix is taken from prefixes.at
        'text string' is used in lieu of the typical 'at' or 'at the' prefix
    [2]=wikilink target article that describes the service; set to nil if not used
    [3]=wikilink label; the label in [[target|label]]; set to nil if not used; when there is no article ([2] is nil) use this to name the service; see wikiwix in the table
    [4]=service ID; set to nil if not used
    [5]=tracking category key from the categories table; set to nil if not used
    [6]=postfix; text string to be appended at the end of the tail string - see webarchive.loc.gov in the table

]=]

-- Archive-service table keyed by a host-name string.  Each value is a
-- positional list:
--   [1] prefix selector: true -> prefixes.atthe, false -> prefixes.at, or a literal string
--   [2] wikilink target describing the service (nil when there is none)
--   [3] wikilink label, or the service's display name when [2] is nil
--   [4] service ID
--   [5] tracking category, taken from the categories table
--   [6] postfix text appended at the end of the tail string
-- Trailing fields that are not used are simply left out of an entry.
-- NOTE(review): entries are kept in their existing order; confirm whether any
-- consumer depends on traversal order before re-sorting or regrouping them.
local services = {
    -- archive.today and its alternate domains share one description and category
    ['archive.ec'] = {false, 'Archive.today', nil, 'archiveis', categories.archiveis},
    ['archive.fo'] = {false, 'Archive.today', nil, 'archiveis', categories.archiveis},
    ['archive.is'] = {false, 'Archive.today', nil, 'archiveis', categories.archiveis},
    ['archive.li'] = {false, 'Archive.today', nil, 'archiveis', categories.archiveis},
    ['archive.md'] = {false, 'Archive.today', nil, 'archiveis', categories.archiveis},
    ['archive.org'] = {true, 'Wayback Machine', nil, 'wayback', categories.wayback},
    ['archive.ph'] = {false, 'Archive.today', nil, 'archiveis', categories.archiveis},
    ['archive.today'] = {false, 'Archive.today', nil, 'archiveis', categories.archiveis},
    ['archive.vn'] = {false, 'Archive.today', nil, 'archiveis', categories.archiveis},
    -- has a service ID but no tracking category
    ['archive-it.org'] = {false, 'Archive-It', nil, 'archiveit'},
    -- no target article ([2] is nil), so [3] names the service
    ['arquivo.pt'] = {true, nil, 'Portuguese Web Archive'},
    ['bibalex.org'] = {false, 'Bibliotheca Alexandrina#Internet Archive partnership', 'Bibliotheca Alexandrina'},
    ['collectionscanada'] = {true, 'Canadian Government Web Archive'},
    ['europarchive.org'] = {true, 'National Library of Ireland'},
    ['freezepage.com'] = {false, nil, 'Freezepage'},
    ['haw.nsk'] = {true, 'Croatian Web Archive (HAW)'},
    ['langzeitarchivierung.bib-bvb.de'] = {false, 'Bavarian State Library'},
    ['loc.gov'] = {true, 'Library of Congress'},
    ['nationalarchives.gov.uk'] = {true, 'UK Government Web Archive'},
    ['nlb.gov.sg'] = {false, 'Web Archive Singapore'},
    ['pandora.nla.gov.au'] = {false, 'Pandora Archive'},
    ['parliament.uk'] = {true, 'UK Parliament\'s Web Archive'},
    ['perma.cc'] = {false, 'Perma.cc'},
    ['perma-archives.cc'] = {false, 'Perma.cc'},
    ['proni.gov'] = {true, 'Public Record Office of Northern Ireland'},
    ['screenshots.com'] = {false, nil, 'Screenshots'},
    ['stanford.edu'] = {true, 'Stanford University Libraries', 'Stanford Web Archive'},
    ['timetravel.mementoweb.org'] = {false, 'Memento Project'},
    ['uni-lj.si'] = {true, nil, 'Slovenian Web Archive'},
    ['veebiarhiiv.digar.ee'] = {true, nil, 'Estonian Web Archive'},
    ['vefsafn.is'] = {true, 'National and University Library of Iceland'},
    ['webarchive.bac-lac.gc.ca'] = {false, 'Library and Archives Canada'},
    -- the only entry that uses the [6] postfix field
    ['webarchive.loc.gov'] = {true, 'Library of Congress', nil, 'locwebarchives', nil, 'Web Archives'},
    ['webarchive.org.uk'] = {true, 'UK Web Archive'},
    ['webcache.googleusercontent.com'] = {false, nil, 'Google Cache'},
    ['webcitation.org'] = {false, 'WebCite', nil, 'webcite', categories.webcite},
    ['webharvest.gov'] = {true, 'National Archives and Records Administration'},
    ['webrecorder.io'] = {false, 'webrecorder.io'},
    ['wikiwix.com'] = {false, nil, 'Wikiwix'},
    ['yorku.ca'] = {false, 'York University Libraries', 'York University Digital Library'},
    }


--[[--------------------------< S T A T I C   T E X T >--------------------------------------------------------

for internationalization

]]

-- Static, translatable text fragments used when the rendered output is assembled.
local s_text = {
    ['addlarchives'] = 'Arquivos adicionais',
    ['addlpages'] = 'Páginas adicionais arquivadas em',
    ['Archive_index'] = 'Índice do arquivo',
    -- capitalized and lower-case forms are separate entries
    ['Archived'] = 'Arquivado',
    ['archived'] = 'arquivado',
    ['archive'] = 'arquivo',
    ['Page'] = 'Página',
}


--[[--------------------------< E R R _ W A R N _ M S G S >----------------------------------------------------

these tables hold error and warning message text

]]

-- Error and warning message texts.  The note on each entry repeats the module
-- function(s) that the original annotations associate with the message.
local err_warn_msgs = {
    -- errors
    ['date_err'] = '[Erro de data]',                          -- decodeWebciteDate, decodeWaybackDate, decodeArchiveisDate
    ['date_miss'] = '[Falta data]',                           -- parseExtraArgs
    ['ts_short'] = '[Comprimento de Timestamp de data]',      -- decodeWaybackDate: timestamp shorter than 8 digits
    ['ts_date'] = '[Data de Timestamp inválido]',             -- decodeWaybackDate: timestamp is not a valid date
    ['unknown_url'] = '[Erro: arquivo url desconhecido]',     -- serviceName
    ['unnamed_params'] = '[Parâmetro posicional ignorado]',

    -- warnings (wrapped in <sup> markup)
    ['mismatch'] = '<sup>[Data trocada]</sup>',               -- webarchive
    ['ts_len'] = '<sup>[Comprimento de Timestamp]</sup>',     -- decodeWaybackDate, decodeArchiveisDate: timestamp is not 14 digits
    ['ts_cal'] = '<sup>[Calendário]</sup>',                   -- decodeWaybackDate: timestamp has a trailing splat
}


-- Critical error message texts.  $1 and $2 in 'conflicting' are placeholders
-- for the two parameter names.
local crit_err_msgs = {
    ['conflicting'] = '|$1= e |$2= em conflito',
    ['empty'] = 'url vazio',
    -- TODO: the two iabot messages below belong to bugs that were purportedly
    -- fixed; removing them is reported to cause a Lua script error at
    -- Template:Webarchive/testcases/Production, so resolve that before
    -- deleting them for good.
    -- ['iabot1'] = 'https://web.http',
    -- ['iabot2'] = 'URL inválido',
    ['invalid_url'] = 'URL inválido',
    ['ts_nan'] = 'Timestamp não é um número',
    ['unknown'] = 'Problema desconhecido. Por favor aviso na página de discussão da predefinição',
}



--[[--------------------------< D A T E   I N T E R N A T I O N A L I Z A T I O N >----------------------------

these tables hold data that is used when converting date formats from non-English languages (because mw.language.getContentLanguage:formatDate()
doesn't understand non-English month names)

]]

-- Month-name to month-number map.  The English names are retained even though
-- they may not be strictly required on the local wiki.
local month_num = {
    -- full English names
    January = 1, February = 2, March = 3, April = 4,
    May = 5, June = 6, July = 7, August = 8,
    September = 9, October = 10, November = 11, December = 12,
    -- abbreviated English names ('May' is already present among the full names)
    Jan = 1, Feb = 2, Mar = 3, Apr = 4,
    Jun = 6, Jul = 7, Aug = 8,
    Sep = 9, Oct = 10, Nov = 11, Dec = 12,
    -- local-wiki month names can be added below in the same name-to-number form:
    -- [''] = 1, [''] = 2, [''] = 3, [''] = 4, [''] = 5, [''] = 6,
    -- [''] = 7, [''] = 8, [''] = 9, [''] = 10, [''] = 11, [''] = 12,
}

                                                                                -- when the local wiki uses non-western digits in dates, local wiki digits must be
                                                                                -- translated to western digits; lua only understands western digits
-- Translation aid for wikis that write dates with non-western digits.
local digits = {
    -- fill these indexes with the local digits, each mapped to its western value:
    -- [''] = 0, [''] = 1, [''] = 2, [''] = 3, [''] = 4,
    -- [''] = 5, [''] = 6, [''] = 7, [''] = 8, [''] = 9,
    ['enable'] = false,    -- set to true to enable local-digit to western-digit translation
}


--[[--------------------------< P A R A M E T E R   I N T E R N A T I O N A L I Z A T I O N >------------------

this table holds tables of parameter names and their non-English aliases.  In the enum_params table '#' is a single
character placeholder for 1 or more digit characters

parameter names in this table shall be lowercase
]]

-- Canonical parameter names, each mapped to the list of names (canonical name
-- first, then aliases) accepted for it.
local params = {
    url = {'url'},
    -- the extra aliases here are for compatibility with Webarchiv from de.wiki
    date = {
        'date', 'datum', 'data',
        'wayback', 'webciteID', 'archive-today', 'archive-is',
    },
    title = {'title', 'titel', 'text', 'título', 'titulo'},
    nolink = {'nolink', 'semlink'},
    format = {'format', 'formato'},
}

-- Enumerated parameter names and their aliases; '#' is a single-character
-- placeholder for one or more digit characters.
local enum_params = {
    ['url#'] = {
        'url#',
    },
    ['date#'] = {
        'date#',
        'datum#',
        'data#',
    },
    ['title#'] = {
        'title#',
        'titel#',
        'título#',
        'titulo#',
    },
}

-- The two values accepted by |format=; local-language variants can be appended
-- to each list.
local format_vals = {
    addlpages = {'addlpages'},
    addlarchives = {'addlarchives'},
}


--[[--------------------------< E X P O R T E D   T A B L E S >------------------------------------------------
]]

-- Collect every table defined in this file under its own name and hand the
-- collection back to whoever loads the module.
local exported = {
    ['categories'] = categories,
    ['config'] = config,
    ['crit_err_msgs'] = crit_err_msgs,
    ['digits'] = digits,
    ['enum_params'] = enum_params,
    ['err_warn_msgs'] = err_warn_msgs,
    ['excepted_pages'] = excepted_pages,
    ['format_vals'] = format_vals,
    ['month_num'] = month_num,
    ['params'] = params,
    ['prefixes'] = prefixes,
    ['services'] = services,
    ['s_text'] = s_text,
    ['uncategorized_namespaces'] = uncategorized_namespaces,
    ['uncategorized_subpages'] = uncategorized_subpages,
}

return exported