MediaWiki:ExtractFirst.xsl

出典: フリー多機能辞典『ウィクショナリー日本語版(Wiktionary)』
移動先: 案内、検索

<?xml version="1.0" encoding="UTF-8"?>

<xsl:stylesheet version="1.0"
xmlns:xsl="http://www.w3.org/1999/XSL/Transform">
<xsl:output method='html'/>
<!-- Localisable strings and site settings. Translate the text values when
     adapting this stylesheet to another Wiktionary. -->
<!-- Text direction written to the dir attribute of the generated html element. -->
<xsl:variable name="dir">ltr</xsl:variable>
<!-- Initial label of the "more" link; the script may replace it when nothing is found. -->
<xsl:variable name="more">» もっと見る</xsl:variable>
<!-- Prefix printed before the info attribute of an api/error element. -->
<xsl:variable name="error">エラー: </xsl:variable>
<!-- Licence footer, copied into the body as markup via xsl:copy-of. Links use https. -->
<xsl:variable name="copyright"> © <a href="https://ja.wiktionary.org/wiki/">ウィクショナリー</a>。<a href="https://creativecommons.org/licenses/by-sa/3.0/deed.ja" rel="license copyright">クリエイティブ・コモンズ 表示-継承ライセンス</a>の下で公開されています。</xsl:variable>
<!-- Language code used for lang/xml:lang and for the wiki host name below. -->
<xsl:variable name="contentLang" select="'ja'"/>
<!-- Site origin used as the base href, so root-relative links resolve against the wiki. -->
<xsl:variable name="pageName" select="concat('https://', $contentLang, '.wiktionary.org')"/>
<xsl:template match="/">
<html dir="{$dir}" lang="{$contentLang}" xml:lang="{$contentLang}">
<head>
<meta name="generator" content="Wiktionary Extract XSLT 1.08-EN"/>
<base target='_blank' href="{$pageName}" />

<title> Wiktionary extract</title>

<style>
#wordThisIsFor { font-weight:bold;}
a.wtif1  { color: black; text-decoration: none;}
a.wtif1:hover {text-decoration: underline;}
.disambig-see-also, .disambig-see-also-2 {display:inline;}
#container {background-color:white; padding: 0.5em; border: solid black thin;}
a.new {color: red;}
#error {color: red;font-size:larger;}
</style>
<script type='text/javascript'>
/*<![CDATA[*/
/*
 * setup(): invoked from the body's onload attribute.
 *
 * Reads its options from location.search. The parameters referenced in this
 * function are:
 *   page     - title of the entry (required; used to build the link URL)
 *   lang     - preferred language code, looked up in preferLang below
 *   count    - number of definitions to show (defaults to 1)
 *   showWord - "none" (default), "link", or any other value for bold text
 *   rd       - redirect counter, incremented on every automatic retry
 *   alt      - alternative title tried when case-folding finds nothing
 */
function setup () {
//Stuff to translate:
// Keyed by the code passed in the lang parameter. The entry must be truthy for
// the language-specific extraction branch to run; 'qqqAny' is the code used
// when no lang parameter is given and maps to null, so that branch is skipped.
// NOTE(review): the values look like the language names as they appear in the
// page's section headings - confirm against the heading-matching regex.
var preferLang = {'ja': '日本語', 'en': '英語', 'fr': 'フランス語', 'de': 'ドイツ語', 'es': 'スペイン語', 'it': 'イタリア語', 'pt': 'ポルトガル語', 'pl': 'ポーランド語', 'ru': 'ロシア語', 'nl': 'オランダ語', 'qqqAny': null}; //for now.

var extractSeeAlso = /

]*?>([\s\S]*?)<\/p>/; //no subexpressions! var see_also_process = function (sa) {return sa[1];} var createLink = '» 作成する'; // text only. var not_found = "$1の語義は見つかりませんでした。"; //END stuff to translate (there is one more translation block below) //Stuff not to translate in general (setup). var rd = location.search.match(/\&rd\=([^&]*)/); //is this from redirect. + converts to numeric. rd = rd ? (+rd[1] + 1) : 1; //redirection level. var showWord = 0; //default to not showing. 0 = none, 1 = bold, 2 = bold link. var showWordRaw = location.search.match(/\&showWord\=([^&]*)/); showWordRaw = showWordRaw ? showWordRaw[1] : 'none'; if (showWordRaw !== "none") { showWord++; } if (showWordRaw === "link") { showWord++; } var numbDfn = location.search.match(/\&count\=([^&]*)/); //count. + converts to numeric. numbDfn = numbDfn ? (parseInt(numbDfn[1])) : 1; //default to 1 var pageURL = '/w/index.php?title=' + encodeURIComponent(decodeURIComponent(location.search.match(/\&page\=([^&]*)/)[1])); var src = document.getElementById('src'); var display = document.getElementById('word-list'); var loc = location.search.match(/\&page\=([^&]*)/)[1]; //this is not escaped var escWord = decodeURIComponent(loc).replace(/&/, '&').replace(/>/, '<').replace(/</, '>'); //note: wordEsc does not escape quotes. DO NOT PUT AS ATTRIBUTE VALUE var preferLangCode = location.search.match(/\&lang\=([^&]*)/); if (preferLangCode) { preferLangCode = preferLangCode[1]; } else {preferLangCode = 'qqqAny';} src.normalize(); var html = src.firstChild.data; var def = html //may be redefined later. //stuff you might need to translate, but hopefully won't var subSectRegex = new RegExp('

[^<]*?(<span[^<]*?<a[^<]*?<\/a[^<]*?</span[^<]*?)?]*>[\\s\\S]*$'); var extractCurLangName = /]*>([\s\S]*?)<\/span>/; //first subexpression //End stuff you hopefully won't need to translate. try { //this assumes attribute order doesn't change!!! html = html.replace(/

[\s\S]*?<\/div>/, );

 if (preferLangCode && preferLang[preferLangCode]) {
  try {
   //strip off all definitions before tagret lang.
   var subSect = html.match(subSectRegex)[0];

if (subSect.match(/

  1. [\s\S]*?
  2. /)) { //if it has content def = subSect; } } catch (e) { /*alert(e)*/} } var lang = def.match(extractCurLangName)[1]; var intro = "(" + lang + ") "; if (showWord) intro = '<a href="' + pageURL + '" id="wordThisIsFor" class="wtif' + showWord + '" >' + escWord + "</a> " + intro ; var definitions_matched; //FIXME: in both cases the extraction method does not properly strip nested divs. This results in image thumbnails being left behind if (numbDfn === 1) { definitions_matched = def.match(/
    [\s\S]*?<\/ol>/)[0].replace(/
    [\s\S]*?<\/dl>/g, ).replace(/<div[^>]*>[\s\S]*?<\/div>/g, ).replace(/<\/div>/g, ).replace(/
    • [\s\S]*?<\/ul>/g, ).replace(/<a href="(#[^"]*)">/g, '<a href="' + pageURL + '$1">').match(/
    • ([\s\S]*?)<\/li>/); display.innerHTML = intro + definitions_matched[1]; } else { //this use not well supported... definitions_matched = def.match(/
      [\s\S]*?<\/ol>/)[0].replace(/
      [\s\S]*?<\/dl>/g, ).replace(/<div[^>]*>[\s\S]*?<\/div>/g, ).replace(/<\/div>/g, ).replace(/
      • [\s\S]*?<\/ul>/g, ).replace(/<a href="(#[^"]*)">/g, '<a href="' + pageURL + '$1">').match(/
      • ([\s\S]*?)<\/li>/g); var tmp = intro + '
        '; for (var i = 0; i < numbDfn && i < definitions_matched.length; i++) { tmp += definitions_matched[i]; } display.innerHTML = tmp + '
        ';
         }
        }
        catch (e) {
         //alert(e)
         //page does not exist, not well formed, these regexs suck, etc
        
        
         //note, this is appending a text node, thus it is ok, that loc is not escaped.
         display.appendChild(document.createTextNode(not_found.replace("$1", decodeURIComponent(loc))));
         document.getElementById('more-link').firstChild.data = createLink;
         if (rd < 9) { //arbitrary to prevent infinite loops
          //make sure don't have loops.
          var newLoc; //this should not be urlEncoded.
          var remAlt = false;
          var dLoc = decodeURIComponent(loc);
        
        
          newLoc = dLoc.charAt(0).toLowerCase() + dLoc.substring(1, loc.length);
          //try some other redirections.
        
        
          if (newLoc === dLoc) newLoc = dLoc.toLowerCase();
          if (newLoc === dLoc && location.search.match(/\&alt\=([^&]*)/)) {
           newLoc = decodeURIComponent(location.search.match(/\&alt\=([^&]*)/)[1]);
           remAlt = true;
          }
          
          if (newLoc !== dLoc) { //redir
           var newURL = location.href.replace(/(^[\s\S]*?\&page\=)[^&]*([\s\S]*$)/, '$1'+ encodeURIComponent(newLoc) + '$2');
           newURL = newURL.replace(/&rd\=[^&]*/, ); //strip old redirect header.
           if (remAlt) {
            location.href.replace(/&alt\=[^&]*/, );
           }
           location = newURL + '&rd=' + rd;
          }
         }
        }
        // Runs after the try/catch above. If the fetched HTML matches
        // extractSeeAlso, the processed match is inserted as markup, wrapped in
        // parentheses, into the element with id "see-also".
        var sa = html.match(extractSeeAlso);
        if(sa) {
         document.getElementById('see-also').innerHTML = ' (' + see_also_process(sa) + ')' ;
        }
        // Point the "more" link at the entry's index.php URL built from the page parameter.
        document.getElementById('more-link').href= pageURL;
        
        
        

        }

        /*]]>*/
        </script>
        
        

        </head>

        <body onload='setup()'>
        
        
        <xsl:apply-templates select='api/error'/>
        <a id='more-link'><xsl:value-of select="$more"/></a> <xsl:copy-of select="$copyright"/>
        </body>
        </html>
        
        </xsl:template>
        <!-- For an api/error element, emit the localised error prefix
             immediately followed by the element's info attribute. -->
        <xsl:template match="api/error">
          <xsl:value-of select="concat($error, @info)"/>
        </xsl:template>
        
        </xsl:stylesheet>