MediaWiki:ExtractFirst.xsl

<?xml version="1.0" encoding="UTF-8"?>

<xsl:stylesheet version="1.0"
xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
<xsl:output method='html'/>
<!-- Text direction of the generated page; read by the dir attribute on the html element. -->
<xsl:variable name="dir">ltr</xsl:variable>
<!-- Localised interface strings (Vietnamese). NOTE(review): none of the five
     strings below is referenced in the visible part of this stylesheet;
     presumably the template or script further down emits them. -->
<!-- "More" link label. -->
<xsl:variable name="more">» Thêm nữa</xsl:variable>
<!-- Prefix for error messages ("Error: "). -->
<xsl:variable name="error">Lỗi: </xsl:variable>
<!-- Label for pronunciation audio ("Pronunciation"). -->
<xsl:variable name="audio">Cách phát âm</xsl:variable>
<!-- Separator string that accompanies the audio label. -->
<xsl:variable name="audio-separator"> • </xsl:variable>
<!-- Attribution and licence notice. The site link uses HTTPS, like the licence link next to it. -->
<xsl:variable name="copyright"> © <a href="https://vi.wiktionary.org/wiki/">Wiktionary</a>. Phát hành theo <a href="https://creativecommons.org/licenses/by-sa/3.0/deed.vi" rel="license copyright">CC BY-SA 3.0</a></xsl:variable>
<!-- Language code of the wiki; used for lang/xml:lang on the html element and to build $pageName. -->
<xsl:variable name="contentLang" select="'vi'"/>

<!-- Origin of the wiki (scheme and host only, despite the name). It becomes the
     href of the base element, so root-relative links resolve against it. Built
     with https so those links do not start on an insecure URL. -->
<xsl:variable name="pageName" select="concat('https://', $contentLang, '.wiktionary.org')"/>
<xsl:template match="/">

<html dir="{$dir}" lang="{$contentLang}" xml:lang="{$contentLang}">
<head>
<!-- Records the name and version of this stylesheet in the generated page. -->
<meta name="generator" content="Wiktionary Extract XSLT 1.10-VI"/>
<!-- Default target for every link is a new browsing context (_blank);
     relative URLs are resolved against $pageName. -->
<base target='_blank' href="{$pageName}" />

<title> Wiktionary extract</title>

<style>
/* The looked-up word: the script gives this id to the link it puts in front of the definition. */
#wordThisIsFor {
  font-weight: bold;
}

/* Class "wtif1" (showWord = 1, "bold"): looks like plain text until hovered. */
a.wtif1 {
  color: black;
  text-decoration: none;
}
a.wtif1:hover {
  text-decoration: underline;
}

/* Keep "see also" boxes inline. */
.disambig-see-also,
.disambig-see-also-2 {
  display: inline;
}

/* Framed white box. */
#container {
  background-color: white;
  padding: 0.5em;
  border: solid black thin;
}

/* Links with class "new" are shown in red. */
a.new {
  color: red;
}

/* Error text: red and one step larger. */
#error {
  color: red;
  font-size: larger;
}

/* Box floated to the right with an outset border; the link inside it is black and not underlined. */
div.exit {
  float: right;
  font-weight: bold;
  font-family: sans-serif;
  border: outset;
  padding: 0.1em;
}
div.exit a {
  color: black;
  text-decoration: none;
}
</style>
<script type='text/javascript'>
/*<![CDATA[*/
function setup () {
//Stuff to translate:
var preferLang = {'en': 'Anh', 'fr': 'Pháp', 'de': 'Đức', 'es': 'Tây Ban Nha', 'it': 'Ý', 'pt': 'Bồ Đào Nha', 'ja': 'Nhật Bản', 'pl': 'Ba Lan', 'ru': 'Nga', 'nl': 'Hà Lan', 'vi': 'Việt', 'qqqAny': null}; //for now.

var extractSeeAlso = /

[\s\S]*?<\/div>/; //no subexpressions!

var see_also_process = function (sa) {return sa;}
var createLink = '» Tạo'; // text only.
var not_found = "Không tìm thấy định nghĩa $1.";

//END stuff to translate (there is one more translation block below)

//Stuff not to translate in general (setup).
//Reads the options passed in location.search and the raw page text held by the
//element with id "src". Every pattern below requires a leading "&", so a
//parameter placed directly after the "?" is not recognised.

var rd = location.search.match(/\&rd\=([^&]*)/); //is this from redirect. + converts to numeric.
rd = rd ? (+rd[1] + 1) : 1; //redirection level.

//showWord: 0 = none (default), 1 = bold, 2 = bold link.
var showWord = 0;
var showWordRaw = location.search.match(/\&showWord\=([^&]*)/);
showWordRaw = showWordRaw ? showWordRaw[1] : 'none';
if (showWordRaw !== "none") {
 showWord++;
}
if (showWordRaw === "link") {
 showWord++;
}

//useAudio: 0 = parameter absent or "none", 1 = any other value, 2 = value starts with "autoplay".
var useAudio = 0;
if (location.search.match(/\&audio\=(?!none)/)) useAudio++;
if (location.search.match(/\&audio\=autoplay/)) useAudio++;

//closeLink: true when "&exit=" is present with a value that does not start with "false".
var closeLink = false;
if (location.search.match(/&exit\=(?!false)/)) closeLink = true;

//Number of definitions requested. Parsed as base 10; a missing or
//non-numeric value falls back to the default of 1 instead of becoming NaN.
var numbDfn = location.search.match(/\&count\=([^&]*)/);
numbDfn = numbDfn ? parseInt(numbDfn[1], 10) : 1;
if (isNaN(numbDfn)) numbDfn = 1;

//Raw (still percent-encoded) page name. As before, this throws when "&page=" is absent.
var loc = location.search.match(/\&page\=([^&]*)/)[1]; //this is not escaped
var pageURL = '/w/index.php?title=' + encodeURIComponent(decodeURIComponent(loc));
var src = document.getElementById('src');
var display = document.getElementById('word-list');

//HTML-escaped page name for use as element content. Every occurrence of
//& < > is replaced, "&" first so the entities produced afterwards are not
//escaped a second time. The entity strings are spliced from two pieces so they
//stay intact even if this script text is ever run through something that
//decodes character references.
//note: escWord does not escape quotes. DO NOT PUT AS ATTRIBUTE VALUE
var escWord = decodeURIComponent(loc)
 .replace(/&/g, '&' + 'amp;')
 .replace(/</g, '&' + 'lt;')
 .replace(/>/g, '&' + 'gt;');

var preferLangCode = location.search.match(/\&lang\=([^&]*)/);
if (preferLangCode) { preferLangCode = preferLangCode[1]; }
else {preferLangCode = 'qqqAny';}

src.normalize(); //merge adjacent text nodes so firstChild holds the whole text
var html = src.firstChild.data;
var def = html; //may be redefined later.

 //stuff you might need to translate, but hopefully won't

var subSectRegex = new RegExp('

[^<]*?(<span[^<]*?<a[^<]*?<\/a[^<]*?</span[^<]*?)?]*>[\\s\\S]*$'); var extractCurLangName = /]*>([\s\S]*?)<\/span>/; //first subexpression //End stuff you hopefully won't need to translate. try { //this assumes attribute order doesn't change!!! html = html.replace(/

[\s\S]*?<\/div>/, );

 if (preferLangCode && preferLang[preferLangCode]) {
  try {
   //strip off all definitions before the target language.
   var subSect = html.match(subSectRegex)[0];

if (subSect.match(/

/)) { //if it has content def = subSect; } } catch (e) { /*alert(e)*/} } var lang = def.match(extractCurLangName)[1]; var intro = "(" + lang + ") "; //Start testing to see if we can play audio. var audioCreditLink; var audioLink = html.match(/\<a\s*\S*?\s*href\=\"?(https?:\/\/upload.wikimedia.org\/\S*.(?:oga|ogg))\"?[^>]*>/); if (!audioLink) audioLink = html.match(/\<button[\s\S]*?\sonclick=\"[\s\S]*?"videoUrl":\s*"(https?:\/\/upload.wikimedia.org\/\S*?)"[^"]*?"isVideo":\sfalse[^"]*?".*?>/); if (audioLink) { audioCreditLink = audioLink[1].match(/\/([^\/]*)$/); if (audioCreditLink) audioCreditLink = 'File:' + audioCreditLink[1] if (useAudio > 0) { var supportsHTML5Audio = (typeof Audio !== 'undefined'); var audioAutoplay = (useAudio === 2) ? "autoplay" : ""; audioLink = encodeURI(decodeURI(audioLink[1])); //should be already encoded, but better safe. intro += ' <audio style="float:right;" controls src="' + audioLink + '" ' + audioAutoplay; + ' >'; //the cortando stuff is inspired (stolen) from oggHandler. //the object tag interferes with the audio tag on firefox for autoplay //specificly it interperts autoplay differently then mplayer does. if (!supportsHTML5Audio) { intro += '<object align="right" type="application/ogg" height="18" width="180" data="' + audioLink + '" autoplay="' + (audioAutoplay === 'autoplay') + '" >'; } intro += '<applet code="com.fluendo.player.Cortado.class" ' + ' width=180' + ' height=20' + ' archive="https://upload.wikimedia.org/jars/cortado.jar">' + ' <param name="url" value="' + audioLink + '" />' + ' <param name="seekable" value="true"/>' + ' <param name="autoPlay" value="' + (audioAutoplay === 'autoplay') + '"/>' + ' <param name="showStatus" value="show"/>' + ' <param name="showSpeaker" value="false"/>' + ' <param name="statusHeight" value="18"/>' + '
</applet>';
```
    if (!supportsHTML5Audio) {
     intro += '</object>';
    }
    intro += '</audio>';
  }
 }
```
```
 if (showWord)  intro = '<a href="' + pageURL + '" id="wordThisIsFor" class="wtif' + showWord + '" >' + escWord + "</a> " + intro ;
```
```
 var definitions_matched;
 //FIXME: in both cases the extraction method does not properly strip nested divs. This results in image thumbnails being left behind
 if (numbDfn === 1) {
```
definitions_matched = def.match(/