tt-rss/tw/lang/TW_base.php

471 lines
12 KiB
PHP

<?php
/*
* tag|wall | PHP Tag Filter |
* ---------------------------------------------------------------------
Copyright (C) 2002 Juraj 'HVGE' Durech
Copyright (C) 2002 www.designia.sk
This program is free software; you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation; either version 2 of the License, or
(at your option) any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program; if not, write to the Free Software
Foundation, Inc., 59 Temple Place, Suite 330, Boston, MA 02111-1307 USA
* ---------------------------------------------------------------------
*/
/*
* $this->pt text
* $this->pti text index
*/
class TW_base // TW_lang extends this class
{
var $error; // error module object
var $output; // output module object
var $out; // output string
var $content_off;
var $tags; // relationships between tags
var $config; // current configuration (twParser::strip_tags())
var $config_tags; // tags in current configuration
var $config_attr; // attributes in current configuration
var $config_req_attr; // required attributes
var $TAG;
var $is_attributes;
var $ATTRIBUTES; // index => array("atr","value")
var $ATTR; // array(atr,value)
var $VALUE;
/********************************************************************************************
* BASE CONSTRUCTOR
*/
function TW_base()
{
global $tw_tag_relations;
$this->stack();
$this->tags = &$tw_tag_relations;
$this->content_off = 0;
}
/*
* BASE "DESTRUCTOR" (parser call this function if end of string is rached)
*/
function base_end()
{
while( $tag = $this->stack_pop() )
{
$this->out .= $this->output->close( $tag );
}
return null;
}
/********************************************************************************************
* TAG STACK implementation
*/
var $Tstack;
function stack() { $this->Tstack[0] = null; }
function stack_push( $tag ) { array_unshift( $this->Tstack, $tag ); }
function stack_pop() { return array_shift( $this->Tstack ); }
function stack_search( $tag ) { return in_array( $tag, $this->Tstack ); }
function stack_top( $tag = null )
{
if( $tag ) return $this->Tstack[0] == $tag;
return $this->Tstack[0];
}
/********************************************************************************************
* S T A R T _ T A G _ f i l t e r <tag atr=value>
*
*/
function START_TAG_filter()
{
$tag = $this->TAG;
if( $tag == null )
{
//###### syntax error
return;
}
if( in_array($tag,$this->config_tags) )
{
//enabled tag
if(is_string($this->config_attr[$tag]))
{
$this->TAG = $tag = $this->config_attr[$tag];
//tag substitution warning
}
// ------- perform attribute check -----------
if($this->is_attributes)
{
if(!$this->config_attr[$tag])
{
$this->ATTRIBUTES = null;
// remove attribute warning
}
else
{
foreach( $this->ATTRIBUTES as $key => $attr )
{
if( ! in_array($attr[0], $this->config_attr[$tag] ) )
{
$this->ATTRIBUTES[$key][1] = null;
// remove attribute warning
continue;
}
// --------- perform value check -----------
if(($val = $attr[1])==null) continue;
if(($cmda = &$this->config[$tag][$attr[0]])==null) continue; //null - accept all values
switch($cmda[0] & 7)
{
case TW_URL:
// V0.1.2: fixed some fatal bugs, big thanx to fczbkk
//
// TODO: make better url check with parse_url()
// $val = strtolower($val);
if(stripos($val, "http://") === false)
{
if(stripos($val, "ftp://") === false)
if(stripos($val, "email:") === false)
if(stripos($val, "https://") === false)
if(stripos($val, "./") === false) // local relative url
$val = "http://".$val;
}
$this->ATTRIBUTES[$key][1] = $val;
break;
case TW_LINK:
//TODO: add link separator check here.
// Do not use this attribute in config!
break;
case TW_NUM:
if( $val >= $cmda[2] && $val <= $cmda[3] ) break;
$this->ATTRIBUTES[$key][1] = $cmda[1];
break;
case TW_CASE:
if( !in_array($val, $cmda[2]) ) $this->ATTRIBUTES[$key][1] = $cmda[1];
break;
}
}
}
}
// check required attributes
if($this->config_req_attr[$tag])
{
if( $this->is_attributes )
foreach( $this->config_req_attr[$tag] as $required )
{
$req_found = 0;
foreach( $this->ATTRIBUTES as $val)
if( $val[0] == $required )
{
$req_found = 1;
break;
}
if($req_found) continue;
switch( $this->config[$tag][$required][0] & 7 )
{
case TW_LINK:
case TW_URL:
// error
break;
default:
$this->ATTRIBUTES[$required] = array($required, $this->config[$tag][$required][1]);
break;
}
}
else
{
foreach( $this->config_req_attr[$tag] as $required )
{
switch( $this->config[$tag][$required][0] & 7 )
{
case TW_LINK:
case TW_URL:
// required tag error
break;
default:
$this->ATTRIBUTES[$required] = array($required, $this->config[$tag][$required][1]);
break;
}
}
}
}
// cross tag removal algorithm
$flag = $this->tags[$tag];
$top = $this->stack_top();
if( $flag[2] != null ) // check if tag before is specified
{
// yes, tag before is specified, check relationship
if(! in_array($top, $flag[2]) )
{
if( $flag[0] & TW_OPT )
{
if( $top == $tag )
{
// End Tag is optional and current tag is the same as last tag (on stack).
// Close previos for XHTML compatibility and open new the same tag.
// Return, because no manipulation with stack is required.
$this->out .= $this->output->close( $tag );
$this->out .= $this->output->pair( $tag, $this->ATTRIBUTES );
return;
}
if( $this->stack_search($tag) )
{
// repair stack
while(($top = $this->stack_pop() ) != $tag )
{
/*if( !($this->tags[$top][0] & TW_OPT ) )
{
// auto close warning
}*/
$this->out .= $this->output->close( $top );
}
$this->stack_push($tag);
$this->out .= $this->output->close( $tag );
$this->out .= $this->output->pair( $tag, $this->ATTRIBUTES );
return;
}
}
// <th>...<td> =>> <th>...</th><td>... (<th> & <td> they have common parent tag (<tr>) )
if( $this->tags[$top][0] & TW_OPT )
{
if( $this->tags[$top][2] == $flag[2] )
{
$this->out .= $this->output->close( $this->stack_pop() );
$this->out .= $this->output->pair( $tag, $this->ATTRIBUTES );
$this->stack_push( $tag );
return;
}
}
// invalid relation between tags #######
return;
}
// valid relationship
}
if( $flag[0] & TW_NOP )
{
//tag without End Tag <br />
$this->out .= $this->output->single( $tag, $this->ATTRIBUTES );
}
else
{
//Tag with End Tag, push to stack
if( ($top == $tag) && ($flag[0] & TW_OPT) )
{
// '<p><p>' => '<p></p><p>'
$this->out .= $this->output->close( $tag );
$this->out .= $this->output->pair( $tag, $this->ATTRIBUTES );
return;
}
$this->out .= $this->output->pair( $tag, $this->ATTRIBUTES );
$this->stack_push( $tag );
}
return;
}
else
{
//disabled tag (or not supported) ######
return;
}
}
/********************************************************************************************
* E N D _ T A G _ f i l t e r </tag>
*
*/
function END_TAG_filter()
{
$tag = $this->TAG;
if( $tag == null )
{
// </>
if ($tag = $this->stack_pop() )
{
$this->out .= $this->output->close($tag);
return;
}
else
{
// kunda underflow :)
return;
}
}
if(in_array($tag,$this->config_tags))
{
// enabled tag
if(is_string($this->config_attr[$tag]))
{
$this->TAG = $tag = $this->config_attr[$tag];
//tag substitution warning
}
$top = $this->stack_top( $tag );
if( $top )
{
$this->out .= $this->output->close( $tag );
$this->stack_pop();
return;
}
if( $this->stack_search($tag) )
{
// closing cross tags
while( ($top = $this->stack_pop()) != $tag )
{
/*if( !($this->tags[$top][0] & TW_OPT ) )
{
// auto close warning
}*/
$this->out .= $this->output->close( $top );
}
$this->out .= $this->output->close( $tag );
}
else
{
// ###### cross tag error
return;
}
}
// drop out warning
}
/*
* THERE ARE STATE IN, OUT & NEW FUNCTIONS
*
*/
/********************************************************************************************
* STATE T_begin '<'
*/
function T_begin_in()
{
$this->tag_position = $this->pti;
$this->TAG = null;
}
// --- MAIN TAG-FILTER FUNCTION ---
function T_begin_out($word)
{
$this->START_TAG_filter();
}
/********************************************************************************************
* STATE TC_begin '</'
*/
function T_Cbegin_in()
{
$this->tag_position = $this->pti;
$this->TAG = null;
}
// TAG CLOSE function
//
function T_Cbegin_out($word)
{
$this->END_TAG_filter();
}
/********************************************************************************************
* STATE T_gettag 'tagname'
*/
function T_gettag_in()
{
$this->is_attributes = 0;
$this->ATTRIBUTES = null;
return;
}
function T_gettag_new($word) { $this->TAG = strtolower($word); }
function T_gettag_out($word) { return; }
/********************************************************************************************
* STATE A_begin '__atr...'
*/
function A_begin_in() { $this->ATTR = null; }
function A_begin_new($word) { $this->ATTR[0] = strtolower($word); }
function A_begin_out($word)
{
if( $this->is_attributes )
{
foreach( $this->ATTRIBUTES as $akey => $aval )
{
if($this->ATTR[0] == $aval[0])
{
// duplicate warning
$this->ATTRIBUTES[$akey] = $aval;
return;
}
}
}
else
{
$this->is_attributes = 1;
}
$this->ATTRIBUTES[] = $this->ATTR;
}
/********************************************************************************************
* STATE V_begin 'atr...'
*/
function V_begin_in() { $this->VALUE = null; }
function V_begin_out($word) { $this->ATTR[1] = $this->VALUE; }
/********************************************************************************************
* STATE VALUE1
*/
function VALUE1_in() { return; }
function VALUE1_out($word) { $this->VALUE = substr($word,0,strlen($word)-1); }
/********************************************************************************************
* STATE VALUE2
*/
function VALUE2_in() { return; }
function VALUE2_out($word)
{
$this->VALUE = str_replace("\"", "&#34", substr($word, 0, strlen($word)-1) );
}
/********************************************************************************************
* STATE VALUE3
*/
function VALUE3_in() { return; }
function VALUE3_out($word) { $this->VALUE = $word; }
} // END class TW_base
?>